ixgbe.c revision 1.14.2.6 1 1.1 dyoung /******************************************************************************
2 1.1 dyoung
3 1.14.2.5 riz Copyright (c) 2001-2013, Intel Corporation
4 1.1 dyoung All rights reserved.
5 1.1 dyoung
6 1.1 dyoung Redistribution and use in source and binary forms, with or without
7 1.1 dyoung modification, are permitted provided that the following conditions are met:
8 1.1 dyoung
9 1.1 dyoung 1. Redistributions of source code must retain the above copyright notice,
10 1.1 dyoung this list of conditions and the following disclaimer.
11 1.1 dyoung
12 1.1 dyoung 2. Redistributions in binary form must reproduce the above copyright
13 1.1 dyoung notice, this list of conditions and the following disclaimer in the
14 1.1 dyoung documentation and/or other materials provided with the distribution.
15 1.1 dyoung
16 1.1 dyoung 3. Neither the name of the Intel Corporation nor the names of its
17 1.1 dyoung contributors may be used to endorse or promote products derived from
18 1.1 dyoung this software without specific prior written permission.
19 1.1 dyoung
20 1.1 dyoung THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
21 1.1 dyoung AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
22 1.1 dyoung IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
23 1.1 dyoung ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
24 1.1 dyoung LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
25 1.1 dyoung CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
26 1.1 dyoung SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
27 1.1 dyoung INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
28 1.1 dyoung CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
29 1.1 dyoung ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
30 1.1 dyoung POSSIBILITY OF SUCH DAMAGE.
31 1.1 dyoung
32 1.1 dyoung ******************************************************************************/
33 1.1 dyoung /*
34 1.1 dyoung * Copyright (c) 2011 The NetBSD Foundation, Inc.
35 1.1 dyoung * All rights reserved.
36 1.1 dyoung *
37 1.1 dyoung * This code is derived from software contributed to The NetBSD Foundation
38 1.1 dyoung * by Coyote Point Systems, Inc.
39 1.1 dyoung *
40 1.1 dyoung * Redistribution and use in source and binary forms, with or without
41 1.1 dyoung * modification, are permitted provided that the following conditions
42 1.1 dyoung * are met:
43 1.1 dyoung * 1. Redistributions of source code must retain the above copyright
44 1.1 dyoung * notice, this list of conditions and the following disclaimer.
45 1.1 dyoung * 2. Redistributions in binary form must reproduce the above copyright
46 1.1 dyoung * notice, this list of conditions and the following disclaimer in the
47 1.1 dyoung * documentation and/or other materials provided with the distribution.
48 1.1 dyoung *
49 1.1 dyoung * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
50 1.1 dyoung * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
51 1.1 dyoung * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
52 1.1 dyoung * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
53 1.1 dyoung * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
54 1.1 dyoung * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
55 1.1 dyoung * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
56 1.1 dyoung * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
57 1.1 dyoung * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
58 1.1 dyoung * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
59 1.1 dyoung * POSSIBILITY OF SUCH DAMAGE.
60 1.1 dyoung */
61 1.14.2.6 snj /*$FreeBSD: head/sys/dev/ixgbe/ixgbe.c 279805 2015-03-09 10:29:15Z araujo $*/
62 1.14.2.6 snj /*$NetBSD: ixgbe.c,v 1.14.2.6 2016/06/14 08:42:34 snj Exp $*/
63 1.1 dyoung
64 1.1 dyoung #include "opt_inet.h"
65 1.14.2.3 martin #include "opt_inet6.h"
66 1.1 dyoung
67 1.1 dyoung #include "ixgbe.h"
68 1.14.2.5 riz #include "vlan.h"
69 1.1 dyoung
70 1.14.2.6 snj #include <sys/cprng.h>
71 1.14.2.6 snj
72 1.1 dyoung /*********************************************************************
73 1.1 dyoung * Set this to one to display debug statistics
74 1.1 dyoung *********************************************************************/
75 1.1 dyoung int ixgbe_display_debug_stats = 0;
76 1.1 dyoung
77 1.1 dyoung /*********************************************************************
78 1.1 dyoung * Driver version
79 1.1 dyoung *********************************************************************/
80 1.14.2.6 snj char ixgbe_driver_version[] = "2.5.15";
81 1.1 dyoung
82 1.1 dyoung /*********************************************************************
83 1.1 dyoung * PCI Device ID Table
84 1.1 dyoung *
85 1.1 dyoung * Used by probe to select devices to load on
86 1.1 dyoung * Last field stores an index into ixgbe_strings
87 1.1 dyoung * Last entry must be all 0s
88 1.1 dyoung *
89 1.1 dyoung * { Vendor ID, Device ID, SubVendor ID, SubDevice ID, String Index }
90 1.1 dyoung *********************************************************************/
91 1.1 dyoung
92 1.1 dyoung static ixgbe_vendor_info_t ixgbe_vendor_info_array[] =
93 1.1 dyoung {
94 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82598AF_DUAL_PORT, 0, 0, 0},
95 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82598AF_SINGLE_PORT, 0, 0, 0},
96 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82598EB_CX4, 0, 0, 0},
97 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82598AT, 0, 0, 0},
98 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82598AT2, 0, 0, 0},
99 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82598, 0, 0, 0},
100 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82598_DA_DUAL_PORT, 0, 0, 0},
101 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82598_CX4_DUAL_PORT, 0, 0, 0},
102 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82598EB_XF_LR, 0, 0, 0},
103 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82598_SR_DUAL_PORT_EM, 0, 0, 0},
104 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82598EB_SFP_LOM, 0, 0, 0},
105 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82599_KX4, 0, 0, 0},
106 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82599_KX4_MEZZ, 0, 0, 0},
107 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82599_SFP, 0, 0, 0},
108 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82599_XAUI_LOM, 0, 0, 0},
109 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82599_CX4, 0, 0, 0},
110 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82599_T3_LOM, 0, 0, 0},
111 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82599_COMBO_BACKPLANE, 0, 0, 0},
112 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82599_BACKPLANE_FCOE, 0, 0, 0},
113 1.14.2.3 martin {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82599_SFP_SF2, 0, 0, 0},
114 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82599_SFP_FCOE, 0, 0, 0},
115 1.14.2.3 martin {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82599EN_SFP, 0, 0, 0},
116 1.14.2.3 martin {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82599_SFP_SF_QP, 0, 0, 0},
117 1.14.2.4 riz {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_X540T, 0, 0, 0},
118 1.1 dyoung /* required last entry */
119 1.1 dyoung {0, 0, 0, 0, 0}
120 1.1 dyoung };
121 1.1 dyoung
122 1.1 dyoung /*********************************************************************
123 1.1 dyoung * Table of branding strings
124 1.1 dyoung *********************************************************************/
125 1.1 dyoung
126 1.1 dyoung static const char *ixgbe_strings[] = {
127 1.1 dyoung "Intel(R) PRO/10GbE PCI-Express Network Driver"
128 1.1 dyoung };
129 1.1 dyoung
130 1.1 dyoung /*********************************************************************
131 1.1 dyoung * Function prototypes
132 1.1 dyoung *********************************************************************/
133 1.1 dyoung static int ixgbe_probe(device_t, cfdata_t, void *);
134 1.1 dyoung static void ixgbe_attach(device_t, device_t, void *);
135 1.1 dyoung static int ixgbe_detach(device_t, int);
136 1.1 dyoung #if 0
137 1.1 dyoung static int ixgbe_shutdown(device_t);
138 1.1 dyoung #endif
139 1.14.2.6 snj #ifdef IXGBE_LEGACY_TX
140 1.14.2.5 riz static void ixgbe_start(struct ifnet *);
141 1.14.2.5 riz static void ixgbe_start_locked(struct tx_ring *, struct ifnet *);
142 1.14.2.6 snj #else /* ! IXGBE_LEGACY_TX */
143 1.1 dyoung static int ixgbe_mq_start(struct ifnet *, struct mbuf *);
144 1.14.2.6 snj static int ixgbe_mq_start_locked(struct ifnet *, struct tx_ring *);
145 1.1 dyoung static void ixgbe_qflush(struct ifnet *);
146 1.14.2.6 snj static void ixgbe_deferred_mq_start(void *, int);
147 1.14.2.6 snj #endif /* IXGBE_LEGACY_TX */
148 1.1 dyoung static int ixgbe_ioctl(struct ifnet *, u_long, void *);
149 1.1 dyoung static void ixgbe_ifstop(struct ifnet *, int);
150 1.1 dyoung static int ixgbe_init(struct ifnet *);
151 1.1 dyoung static void ixgbe_init_locked(struct adapter *);
152 1.1 dyoung static void ixgbe_stop(void *);
153 1.1 dyoung static void ixgbe_media_status(struct ifnet *, struct ifmediareq *);
154 1.1 dyoung static int ixgbe_media_change(struct ifnet *);
155 1.1 dyoung static void ixgbe_identify_hardware(struct adapter *);
156 1.1 dyoung static int ixgbe_allocate_pci_resources(struct adapter *,
157 1.1 dyoung const struct pci_attach_args *);
158 1.14.2.6 snj static void ixgbe_get_slot_info(struct ixgbe_hw *);
159 1.1 dyoung static int ixgbe_allocate_msix(struct adapter *,
160 1.1 dyoung const struct pci_attach_args *);
161 1.1 dyoung static int ixgbe_allocate_legacy(struct adapter *,
162 1.1 dyoung const struct pci_attach_args *);
163 1.1 dyoung static int ixgbe_allocate_queues(struct adapter *);
164 1.1 dyoung static int ixgbe_setup_msix(struct adapter *);
165 1.1 dyoung static void ixgbe_free_pci_resources(struct adapter *);
166 1.1 dyoung static void ixgbe_local_timer(void *);
167 1.1 dyoung static int ixgbe_setup_interface(device_t, struct adapter *);
168 1.1 dyoung static void ixgbe_config_link(struct adapter *);
169 1.1 dyoung
170 1.1 dyoung static int ixgbe_allocate_transmit_buffers(struct tx_ring *);
171 1.1 dyoung static int ixgbe_setup_transmit_structures(struct adapter *);
172 1.1 dyoung static void ixgbe_setup_transmit_ring(struct tx_ring *);
173 1.1 dyoung static void ixgbe_initialize_transmit_units(struct adapter *);
174 1.1 dyoung static void ixgbe_free_transmit_structures(struct adapter *);
175 1.1 dyoung static void ixgbe_free_transmit_buffers(struct tx_ring *);
176 1.1 dyoung
177 1.1 dyoung static int ixgbe_allocate_receive_buffers(struct rx_ring *);
178 1.1 dyoung static int ixgbe_setup_receive_structures(struct adapter *);
179 1.1 dyoung static int ixgbe_setup_receive_ring(struct rx_ring *);
180 1.1 dyoung static void ixgbe_initialize_receive_units(struct adapter *);
181 1.1 dyoung static void ixgbe_free_receive_structures(struct adapter *);
182 1.1 dyoung static void ixgbe_free_receive_buffers(struct rx_ring *);
183 1.1 dyoung static void ixgbe_setup_hw_rsc(struct rx_ring *);
184 1.1 dyoung
185 1.1 dyoung static void ixgbe_enable_intr(struct adapter *);
186 1.1 dyoung static void ixgbe_disable_intr(struct adapter *);
187 1.1 dyoung static void ixgbe_update_stats_counters(struct adapter *);
188 1.14.2.6 snj static void ixgbe_txeof(struct tx_ring *);
189 1.14.2.5 riz static bool ixgbe_rxeof(struct ix_queue *);
190 1.1 dyoung static void ixgbe_rx_checksum(u32, struct mbuf *, u32,
191 1.1 dyoung struct ixgbe_hw_stats *);
192 1.1 dyoung static void ixgbe_set_promisc(struct adapter *);
193 1.1 dyoung static void ixgbe_set_multi(struct adapter *);
194 1.1 dyoung static void ixgbe_update_link_status(struct adapter *);
195 1.1 dyoung static void ixgbe_refresh_mbufs(struct rx_ring *, int);
196 1.1 dyoung static int ixgbe_xmit(struct tx_ring *, struct mbuf *);
197 1.1 dyoung static int ixgbe_set_flowcntl(SYSCTLFN_PROTO);
198 1.1 dyoung static int ixgbe_set_advertise(SYSCTLFN_PROTO);
199 1.14.2.4 riz static int ixgbe_set_thermal_test(SYSCTLFN_PROTO);
200 1.1 dyoung static int ixgbe_dma_malloc(struct adapter *, bus_size_t,
201 1.1 dyoung struct ixgbe_dma_alloc *, int);
202 1.1 dyoung static void ixgbe_dma_free(struct adapter *, struct ixgbe_dma_alloc *);
203 1.14.2.5 riz static int ixgbe_tx_ctx_setup(struct tx_ring *,
204 1.14.2.5 riz struct mbuf *, u32 *, u32 *);
205 1.14.2.5 riz static int ixgbe_tso_setup(struct tx_ring *,
206 1.14.2.5 riz struct mbuf *, u32 *, u32 *);
207 1.1 dyoung static void ixgbe_set_ivar(struct adapter *, u8, u8, s8);
208 1.1 dyoung static void ixgbe_configure_ivars(struct adapter *);
209 1.1 dyoung static u8 * ixgbe_mc_array_itr(struct ixgbe_hw *, u8 **, u32 *);
210 1.1 dyoung
211 1.1 dyoung static void ixgbe_setup_vlan_hw_support(struct adapter *);
212 1.1 dyoung #if 0
213 1.1 dyoung static void ixgbe_register_vlan(void *, struct ifnet *, u16);
214 1.1 dyoung static void ixgbe_unregister_vlan(void *, struct ifnet *, u16);
215 1.1 dyoung #endif
216 1.1 dyoung
217 1.1 dyoung static void ixgbe_add_hw_stats(struct adapter *adapter);
218 1.1 dyoung
219 1.1 dyoung static __inline void ixgbe_rx_discard(struct rx_ring *, int);
220 1.1 dyoung static __inline void ixgbe_rx_input(struct rx_ring *, struct ifnet *,
221 1.1 dyoung struct mbuf *, u32);
222 1.1 dyoung
223 1.14.2.4 riz static void ixgbe_enable_rx_drop(struct adapter *);
224 1.14.2.4 riz static void ixgbe_disable_rx_drop(struct adapter *);
225 1.14.2.4 riz
226 1.1 dyoung /* Support for pluggable optic modules */
227 1.1 dyoung static bool ixgbe_sfp_probe(struct adapter *);
228 1.1 dyoung static void ixgbe_setup_optics(struct adapter *);
229 1.1 dyoung
230 1.1 dyoung /* Legacy (single vector interrupt handler */
231 1.1 dyoung static int ixgbe_legacy_irq(void *);
232 1.1 dyoung
233 1.1 dyoung #if defined(NETBSD_MSI_OR_MSIX)
234 1.1 dyoung /* The MSI/X Interrupt handlers */
235 1.1 dyoung static void ixgbe_msix_que(void *);
236 1.1 dyoung static void ixgbe_msix_link(void *);
237 1.1 dyoung #endif
238 1.1 dyoung
239 1.1 dyoung /* Software interrupts for deferred work */
240 1.1 dyoung static void ixgbe_handle_que(void *);
241 1.1 dyoung static void ixgbe_handle_link(void *);
242 1.1 dyoung static void ixgbe_handle_msf(void *);
243 1.1 dyoung static void ixgbe_handle_mod(void *);
244 1.1 dyoung
245 1.1 dyoung const struct sysctlnode *ixgbe_sysctl_instance(struct adapter *);
246 1.1 dyoung static ixgbe_vendor_info_t *ixgbe_lookup(const struct pci_attach_args *);
247 1.1 dyoung
248 1.1 dyoung #ifdef IXGBE_FDIR
249 1.1 dyoung static void ixgbe_atr(struct tx_ring *, struct mbuf *);
250 1.1 dyoung static void ixgbe_reinit_fdir(void *, int);
251 1.1 dyoung #endif
252 1.1 dyoung
253 1.14.2.6 snj /* Missing shared code prototype */
254 1.14.2.6 snj extern void ixgbe_stop_mac_link_on_d3_82599(struct ixgbe_hw *hw);
255 1.14.2.6 snj
256 1.1 dyoung /*********************************************************************
257 1.1 dyoung * FreeBSD Device Interface Entry Points
258 1.1 dyoung *********************************************************************/
259 1.1 dyoung
260 1.1 dyoung CFATTACH_DECL3_NEW(ixg, sizeof(struct adapter),
261 1.1 dyoung ixgbe_probe, ixgbe_attach, ixgbe_detach, NULL, NULL, NULL,
262 1.1 dyoung DVF_DETACH_SHUTDOWN);
263 1.1 dyoung
264 1.1 dyoung #if 0
265 1.1 dyoung devclass_t ixgbe_devclass;
266 1.1 dyoung DRIVER_MODULE(ixgbe, pci, ixgbe_driver, ixgbe_devclass, 0, 0);
267 1.1 dyoung
268 1.1 dyoung MODULE_DEPEND(ixgbe, pci, 1, 1, 1);
269 1.1 dyoung MODULE_DEPEND(ixgbe, ether, 1, 1, 1);
270 1.1 dyoung #endif
271 1.1 dyoung
272 1.1 dyoung /*
273 1.1 dyoung ** TUNEABLE PARAMETERS:
274 1.1 dyoung */
275 1.1 dyoung
276 1.1 dyoung /*
277 1.1 dyoung ** AIM: Adaptive Interrupt Moderation
278 1.1 dyoung ** which means that the interrupt rate
279 1.1 dyoung ** is varied over time based on the
280 1.1 dyoung ** traffic for that interrupt vector
281 1.1 dyoung */
282 1.1 dyoung static int ixgbe_enable_aim = TRUE;
283 1.14.2.6 snj #define SYSCTL_INT(__x, __y)
284 1.14.2.6 snj SYSCTL_INT("hw.ixgbe.enable_aim", &ixgbe_enable_aim);
285 1.1 dyoung
286 1.14.2.3 martin static int ixgbe_max_interrupt_rate = (4000000 / IXGBE_LOW_LATENCY);
287 1.14.2.6 snj SYSCTL_INT("hw.ixgbe.max_interrupt_rate", &ixgbe_max_interrupt_rate);
288 1.1 dyoung
289 1.1 dyoung /* How many packets rxeof tries to clean at a time */
290 1.1 dyoung static int ixgbe_rx_process_limit = 256;
291 1.14.2.6 snj SYSCTL_INT("hw.ixgbe.rx_process_limit", &ixgbe_rx_process_limit);
292 1.1 dyoung
293 1.14.2.5 riz /* How many packets txeof tries to clean at a time */
294 1.14.2.5 riz static int ixgbe_tx_process_limit = 256;
295 1.14.2.6 snj SYSCTL_INT("hw.ixgbe.tx_process_limit", &ixgbe_tx_process_limit);
296 1.14.2.5 riz
297 1.1 dyoung /*
298 1.1 dyoung ** Smart speed setting, default to on
299 1.1 dyoung ** this only works as a compile option
300 1.1 dyoung ** right now as its during attach, set
301 1.1 dyoung ** this to 'ixgbe_smart_speed_off' to
302 1.1 dyoung ** disable.
303 1.1 dyoung */
304 1.1 dyoung static int ixgbe_smart_speed = ixgbe_smart_speed_on;
305 1.1 dyoung
306 1.1 dyoung /*
307 1.1 dyoung * MSIX should be the default for best performance,
308 1.1 dyoung * but this allows it to be forced off for testing.
309 1.1 dyoung */
310 1.1 dyoung static int ixgbe_enable_msix = 1;
311 1.14.2.6 snj SYSCTL_INT("hw.ixgbe.enable_msix", &ixgbe_enable_msix);
312 1.1 dyoung
313 1.1 dyoung #if defined(NETBSD_MSI_OR_MSIX)
314 1.1 dyoung /*
315 1.1 dyoung * Number of Queues, can be set to 0,
316 1.1 dyoung * it then autoconfigures based on the
317 1.1 dyoung * number of cpus with a max of 8. This
318 1.1 dyoung * can be overriden manually here.
319 1.1 dyoung */
320 1.1 dyoung static int ixgbe_num_queues = 0;
321 1.14.2.6 snj SYSCTL_INT("hw.ixgbe.num_queues", &ixgbe_num_queues);
322 1.1 dyoung #endif
323 1.1 dyoung
324 1.1 dyoung /*
325 1.1 dyoung ** Number of TX descriptors per ring,
326 1.1 dyoung ** setting higher than RX as this seems
327 1.1 dyoung ** the better performing choice.
328 1.1 dyoung */
329 1.1 dyoung static int ixgbe_txd = PERFORM_TXD;
330 1.14.2.6 snj SYSCTL_INT("hw.ixgbe.txd", &ixgbe_txd);
331 1.1 dyoung
332 1.1 dyoung /* Number of RX descriptors per ring */
333 1.1 dyoung static int ixgbe_rxd = PERFORM_RXD;
334 1.14.2.6 snj SYSCTL_INT("hw.ixgbe.rxd", &ixgbe_rxd);
335 1.14.2.6 snj
336 1.14.2.6 snj /*
337 1.14.2.6 snj ** Defining this on will allow the use
338 1.14.2.6 snj ** of unsupported SFP+ modules, note that
339 1.14.2.6 snj ** doing so you are on your own :)
340 1.14.2.6 snj */
341 1.14.2.6 snj static int allow_unsupported_sfp = false;
342 1.14.2.6 snj SYSCTL_INT("hw.ix.unsupported_sfp", &allow_unsupported_sfp);
343 1.1 dyoung
344 1.14.2.4 riz /*
345 1.14.2.4 riz ** HW RSC control:
346 1.14.2.4 riz ** this feature only works with
347 1.14.2.4 riz ** IPv4, and only on 82599 and later.
348 1.14.2.4 riz ** Also this will cause IP forwarding to
349 1.14.2.4 riz ** fail and that can't be controlled by
350 1.14.2.4 riz ** the stack as LRO can. For all these
351 1.14.2.4 riz ** reasons I've deemed it best to leave
352 1.14.2.4 riz ** this off and not bother with a tuneable
353 1.14.2.4 riz ** interface, this would need to be compiled
354 1.14.2.4 riz ** to enable.
355 1.14.2.4 riz */
356 1.14.2.4 riz static bool ixgbe_rsc_enable = FALSE;
357 1.14.2.4 riz
358 1.1 dyoung /* Keep running tab on them for sanity check */
359 1.1 dyoung static int ixgbe_total_ports;
360 1.1 dyoung
361 1.1 dyoung #ifdef IXGBE_FDIR
362 1.1 dyoung /*
363 1.1 dyoung ** For Flow Director: this is the
364 1.1 dyoung ** number of TX packets we sample
365 1.1 dyoung ** for the filter pool, this means
366 1.1 dyoung ** every 20th packet will be probed.
367 1.1 dyoung **
368 1.1 dyoung ** This feature can be disabled by
369 1.1 dyoung ** setting this to 0.
370 1.1 dyoung */
371 1.1 dyoung static int atr_sample_rate = 20;
372 1.1 dyoung /*
373 1.1 dyoung ** Flow Director actually 'steals'
374 1.1 dyoung ** part of the packet buffer as its
375 1.1 dyoung ** filter pool, this variable controls
376 1.1 dyoung ** how much it uses:
377 1.1 dyoung ** 0 = 64K, 1 = 128K, 2 = 256K
378 1.1 dyoung */
379 1.1 dyoung static int fdir_pballoc = 1;
380 1.1 dyoung #endif
381 1.1 dyoung
382 1.14.2.3 martin #ifdef DEV_NETMAP
383 1.14.2.3 martin /*
384 1.14.2.3 martin * The #ifdef DEV_NETMAP / #endif blocks in this file are meant to
385 1.14.2.3 martin * be a reference on how to implement netmap support in a driver.
386 1.14.2.3 martin * Additional comments are in ixgbe_netmap.h .
387 1.14.2.3 martin *
388 1.14.2.4 riz * <dev/netmap/ixgbe_netmap.h> contains functions for netmap support
389 1.14.2.3 martin * that extend the standard driver.
390 1.14.2.3 martin */
391 1.14.2.3 martin #include <dev/netmap/ixgbe_netmap.h>
392 1.14.2.3 martin #endif /* DEV_NETMAP */
393 1.14.2.3 martin
394 1.1 dyoung /*********************************************************************
395 1.1 dyoung * Device identification routine
396 1.1 dyoung *
397 1.1 dyoung * ixgbe_probe determines if the driver should be loaded on
398 1.1 dyoung * adapter based on PCI vendor/device id of the adapter.
399 1.1 dyoung *
400 1.1 dyoung * return 1 on success, 0 on failure
401 1.1 dyoung *********************************************************************/
402 1.1 dyoung
403 1.1 dyoung static int
404 1.1 dyoung ixgbe_probe(device_t dev, cfdata_t cf, void *aux)
405 1.1 dyoung {
406 1.1 dyoung const struct pci_attach_args *pa = aux;
407 1.1 dyoung
408 1.1 dyoung return (ixgbe_lookup(pa) != NULL) ? 1 : 0;
409 1.1 dyoung }
410 1.1 dyoung
411 1.1 dyoung static ixgbe_vendor_info_t *
412 1.1 dyoung ixgbe_lookup(const struct pci_attach_args *pa)
413 1.1 dyoung {
414 1.1 dyoung pcireg_t subid;
415 1.1 dyoung ixgbe_vendor_info_t *ent;
416 1.1 dyoung
417 1.1 dyoung INIT_DEBUGOUT("ixgbe_probe: begin");
418 1.1 dyoung
419 1.1 dyoung if (PCI_VENDOR(pa->pa_id) != IXGBE_INTEL_VENDOR_ID)
420 1.1 dyoung return NULL;
421 1.1 dyoung
422 1.1 dyoung subid = pci_conf_read(pa->pa_pc, pa->pa_tag, PCI_SUBSYS_ID_REG);
423 1.1 dyoung
424 1.1 dyoung for (ent = ixgbe_vendor_info_array; ent->vendor_id != 0; ent++) {
425 1.1 dyoung if (PCI_VENDOR(pa->pa_id) == ent->vendor_id &&
426 1.1 dyoung PCI_PRODUCT(pa->pa_id) == ent->device_id &&
427 1.1 dyoung
428 1.1 dyoung (PCI_SUBSYS_VENDOR(subid) == ent->subvendor_id ||
429 1.1 dyoung ent->subvendor_id == 0) &&
430 1.1 dyoung
431 1.1 dyoung (PCI_SUBSYS_ID(subid) == ent->subdevice_id ||
432 1.1 dyoung ent->subdevice_id == 0)) {
433 1.1 dyoung ++ixgbe_total_ports;
434 1.1 dyoung return ent;
435 1.1 dyoung }
436 1.1 dyoung }
437 1.1 dyoung return NULL;
438 1.1 dyoung }
439 1.1 dyoung
440 1.1 dyoung
441 1.1 dyoung static void
442 1.1 dyoung ixgbe_sysctl_attach(struct adapter *adapter)
443 1.1 dyoung {
444 1.1 dyoung struct sysctllog **log;
445 1.1 dyoung const struct sysctlnode *rnode, *cnode;
446 1.1 dyoung device_t dev;
447 1.1 dyoung
448 1.1 dyoung dev = adapter->dev;
449 1.1 dyoung log = &adapter->sysctllog;
450 1.1 dyoung
451 1.1 dyoung if ((rnode = ixgbe_sysctl_instance(adapter)) == NULL) {
452 1.1 dyoung aprint_error_dev(dev, "could not create sysctl root\n");
453 1.1 dyoung return;
454 1.1 dyoung }
455 1.1 dyoung
456 1.1 dyoung if (sysctl_createv(log, 0, &rnode, &cnode,
457 1.1 dyoung CTLFLAG_READONLY, CTLTYPE_INT,
458 1.1 dyoung "num_rx_desc", SYSCTL_DESCR("Number of rx descriptors"),
459 1.1 dyoung NULL, 0, &adapter->num_rx_desc, 0, CTL_CREATE, CTL_EOL) != 0)
460 1.1 dyoung aprint_error_dev(dev, "could not create sysctl\n");
461 1.1 dyoung
462 1.1 dyoung if (sysctl_createv(log, 0, &rnode, &cnode,
463 1.1 dyoung CTLFLAG_READONLY, CTLTYPE_INT,
464 1.1 dyoung "num_queues", SYSCTL_DESCR("Number of queues"),
465 1.1 dyoung NULL, 0, &adapter->num_queues, 0, CTL_CREATE, CTL_EOL) != 0)
466 1.1 dyoung aprint_error_dev(dev, "could not create sysctl\n");
467 1.1 dyoung
468 1.1 dyoung if (sysctl_createv(log, 0, &rnode, &cnode,
469 1.1 dyoung CTLFLAG_READWRITE, CTLTYPE_INT,
470 1.14.2.4 riz "fc", SYSCTL_DESCR("Flow Control"),
471 1.3 dsl ixgbe_set_flowcntl, 0, (void *)adapter, 0, CTL_CREATE, CTL_EOL) != 0)
472 1.1 dyoung aprint_error_dev(dev, "could not create sysctl\n");
473 1.1 dyoung
474 1.1 dyoung /* XXX This is an *instance* sysctl controlling a *global* variable.
475 1.1 dyoung * XXX It's that way in the FreeBSD driver that this derives from.
476 1.1 dyoung */
477 1.1 dyoung if (sysctl_createv(log, 0, &rnode, &cnode,
478 1.1 dyoung CTLFLAG_READWRITE, CTLTYPE_INT,
479 1.1 dyoung "enable_aim", SYSCTL_DESCR("Interrupt Moderation"),
480 1.1 dyoung NULL, 0, &ixgbe_enable_aim, 0, CTL_CREATE, CTL_EOL) != 0)
481 1.1 dyoung aprint_error_dev(dev, "could not create sysctl\n");
482 1.14.2.4 riz
483 1.14.2.4 riz if (sysctl_createv(log, 0, &rnode, &cnode,
484 1.14.2.4 riz CTLFLAG_READWRITE, CTLTYPE_INT,
485 1.14.2.4 riz "advertise_speed", SYSCTL_DESCR("Link Speed"),
486 1.14.2.4 riz ixgbe_set_advertise, 0, (void *)adapter, 0, CTL_CREATE, CTL_EOL) != 0)
487 1.14.2.4 riz aprint_error_dev(dev, "could not create sysctl\n");
488 1.14.2.4 riz
489 1.14.2.4 riz if (sysctl_createv(log, 0, &rnode, &cnode,
490 1.14.2.4 riz CTLFLAG_READWRITE, CTLTYPE_INT,
491 1.14.2.4 riz "ts", SYSCTL_DESCR("Thermal Test"),
492 1.14.2.4 riz ixgbe_set_thermal_test, 0, (void *)adapter, 0, CTL_CREATE, CTL_EOL) != 0)
493 1.14.2.4 riz aprint_error_dev(dev, "could not create sysctl\n");
494 1.1 dyoung }
495 1.1 dyoung
496 1.1 dyoung /*********************************************************************
497 1.1 dyoung * Device initialization routine
498 1.1 dyoung *
499 1.1 dyoung * The attach entry point is called when the driver is being loaded.
500 1.1 dyoung * This routine identifies the type of hardware, allocates all resources
501 1.1 dyoung * and initializes the hardware.
502 1.1 dyoung *
503 1.1 dyoung * return 0 on success, positive on failure
504 1.1 dyoung *********************************************************************/
505 1.1 dyoung
506 1.1 dyoung static void
507 1.1 dyoung ixgbe_attach(device_t parent, device_t dev, void *aux)
508 1.1 dyoung {
509 1.1 dyoung struct adapter *adapter;
510 1.1 dyoung struct ixgbe_hw *hw;
511 1.1 dyoung int error = 0;
512 1.1 dyoung u16 csum;
513 1.1 dyoung u32 ctrl_ext;
514 1.1 dyoung ixgbe_vendor_info_t *ent;
515 1.1 dyoung const struct pci_attach_args *pa = aux;
516 1.1 dyoung
517 1.1 dyoung INIT_DEBUGOUT("ixgbe_attach: begin");
518 1.1 dyoung
519 1.1 dyoung /* Allocate, clear, and link in our adapter structure */
520 1.1 dyoung adapter = device_private(dev);
521 1.1 dyoung adapter->dev = adapter->osdep.dev = dev;
522 1.1 dyoung hw = &adapter->hw;
523 1.1 dyoung adapter->osdep.pc = pa->pa_pc;
524 1.1 dyoung adapter->osdep.tag = pa->pa_tag;
525 1.1 dyoung adapter->osdep.dmat = pa->pa_dmat;
526 1.14.2.6 snj adapter->osdep.attached = false;
527 1.1 dyoung
528 1.1 dyoung ent = ixgbe_lookup(pa);
529 1.1 dyoung
530 1.1 dyoung KASSERT(ent != NULL);
531 1.1 dyoung
532 1.1 dyoung aprint_normal(": %s, Version - %s\n",
533 1.1 dyoung ixgbe_strings[ent->index], ixgbe_driver_version);
534 1.1 dyoung
535 1.1 dyoung /* Core Lock Init*/
536 1.1 dyoung IXGBE_CORE_LOCK_INIT(adapter, device_xname(dev));
537 1.1 dyoung
538 1.1 dyoung /* SYSCTL APIs */
539 1.1 dyoung
540 1.1 dyoung ixgbe_sysctl_attach(adapter);
541 1.1 dyoung
542 1.1 dyoung /* Set up the timer callout */
543 1.1 dyoung callout_init(&adapter->timer, 0);
544 1.1 dyoung
545 1.1 dyoung /* Determine hardware revision */
546 1.1 dyoung ixgbe_identify_hardware(adapter);
547 1.1 dyoung
548 1.1 dyoung /* Do base PCI setup - map BAR0 */
549 1.1 dyoung if (ixgbe_allocate_pci_resources(adapter, pa)) {
550 1.1 dyoung aprint_error_dev(dev, "Allocation of PCI resources failed\n");
551 1.1 dyoung error = ENXIO;
552 1.1 dyoung goto err_out;
553 1.1 dyoung }
554 1.1 dyoung
555 1.1 dyoung /* Do descriptor calc and sanity checks */
556 1.1 dyoung if (((ixgbe_txd * sizeof(union ixgbe_adv_tx_desc)) % DBA_ALIGN) != 0 ||
557 1.1 dyoung ixgbe_txd < MIN_TXD || ixgbe_txd > MAX_TXD) {
558 1.1 dyoung aprint_error_dev(dev, "TXD config issue, using default!\n");
559 1.1 dyoung adapter->num_tx_desc = DEFAULT_TXD;
560 1.1 dyoung } else
561 1.1 dyoung adapter->num_tx_desc = ixgbe_txd;
562 1.1 dyoung
563 1.1 dyoung /*
564 1.1 dyoung ** With many RX rings it is easy to exceed the
565 1.1 dyoung ** system mbuf allocation. Tuning nmbclusters
566 1.1 dyoung ** can alleviate this.
567 1.1 dyoung */
568 1.1 dyoung if (nmbclusters > 0 ) {
569 1.1 dyoung int s;
570 1.1 dyoung s = (ixgbe_rxd * adapter->num_queues) * ixgbe_total_ports;
571 1.1 dyoung if (s > nmbclusters) {
572 1.1 dyoung aprint_error_dev(dev, "RX Descriptors exceed "
573 1.1 dyoung "system mbuf max, using default instead!\n");
574 1.1 dyoung ixgbe_rxd = DEFAULT_RXD;
575 1.1 dyoung }
576 1.1 dyoung }
577 1.1 dyoung
578 1.1 dyoung if (((ixgbe_rxd * sizeof(union ixgbe_adv_rx_desc)) % DBA_ALIGN) != 0 ||
579 1.14.2.6 snj ixgbe_rxd < MIN_RXD || ixgbe_rxd > MAX_RXD) {
580 1.1 dyoung aprint_error_dev(dev, "RXD config issue, using default!\n");
581 1.1 dyoung adapter->num_rx_desc = DEFAULT_RXD;
582 1.1 dyoung } else
583 1.1 dyoung adapter->num_rx_desc = ixgbe_rxd;
584 1.1 dyoung
585 1.1 dyoung /* Allocate our TX/RX Queues */
586 1.1 dyoung if (ixgbe_allocate_queues(adapter)) {
587 1.1 dyoung error = ENOMEM;
588 1.1 dyoung goto err_out;
589 1.1 dyoung }
590 1.1 dyoung
591 1.1 dyoung /* Allocate multicast array memory. */
592 1.1 dyoung adapter->mta = malloc(sizeof(u8) * IXGBE_ETH_LENGTH_OF_ADDRESS *
593 1.1 dyoung MAX_NUM_MULTICAST_ADDRESSES, M_DEVBUF, M_NOWAIT);
594 1.1 dyoung if (adapter->mta == NULL) {
595 1.1 dyoung aprint_error_dev(dev, "Cannot allocate multicast setup array\n");
596 1.1 dyoung error = ENOMEM;
597 1.1 dyoung goto err_late;
598 1.1 dyoung }
599 1.1 dyoung
600 1.1 dyoung /* Initialize the shared code */
601 1.14.2.6 snj hw->allow_unsupported_sfp = allow_unsupported_sfp;
602 1.1 dyoung error = ixgbe_init_shared_code(hw);
603 1.1 dyoung if (error == IXGBE_ERR_SFP_NOT_PRESENT) {
604 1.1 dyoung /*
605 1.1 dyoung ** No optics in this port, set up
606 1.1 dyoung ** so the timer routine will probe
607 1.1 dyoung ** for later insertion.
608 1.1 dyoung */
609 1.1 dyoung adapter->sfp_probe = TRUE;
610 1.1 dyoung error = 0;
611 1.1 dyoung } else if (error == IXGBE_ERR_SFP_NOT_SUPPORTED) {
612 1.1 dyoung aprint_error_dev(dev,"Unsupported SFP+ module detected!\n");
613 1.1 dyoung error = EIO;
614 1.1 dyoung goto err_late;
615 1.1 dyoung } else if (error) {
616 1.1 dyoung aprint_error_dev(dev,"Unable to initialize the shared code\n");
617 1.1 dyoung error = EIO;
618 1.1 dyoung goto err_late;
619 1.1 dyoung }
620 1.1 dyoung
621 1.1 dyoung /* Make sure we have a good EEPROM before we read from it */
622 1.1 dyoung if (ixgbe_validate_eeprom_checksum(&adapter->hw, &csum) < 0) {
623 1.1 dyoung aprint_error_dev(dev,"The EEPROM Checksum Is Not Valid\n");
624 1.1 dyoung error = EIO;
625 1.1 dyoung goto err_late;
626 1.1 dyoung }
627 1.1 dyoung
628 1.1 dyoung error = ixgbe_init_hw(hw);
629 1.14.2.4 riz switch (error) {
630 1.14.2.4 riz case IXGBE_ERR_EEPROM_VERSION:
631 1.1 dyoung aprint_error_dev(dev, "This device is a pre-production adapter/"
632 1.1 dyoung "LOM. Please be aware there may be issues associated "
633 1.1 dyoung "with your hardware.\n If you are experiencing problems "
634 1.1 dyoung "please contact your Intel or hardware representative "
635 1.1 dyoung "who provided you with this hardware.\n");
636 1.14.2.4 riz break;
637 1.14.2.4 riz case IXGBE_ERR_SFP_NOT_SUPPORTED:
638 1.1 dyoung aprint_error_dev(dev,"Unsupported SFP+ Module\n");
639 1.1 dyoung error = EIO;
640 1.1 dyoung aprint_error_dev(dev,"Hardware Initialization Failure\n");
641 1.1 dyoung goto err_late;
642 1.14.2.4 riz case IXGBE_ERR_SFP_NOT_PRESENT:
643 1.14.2.4 riz device_printf(dev,"No SFP+ Module found\n");
644 1.14.2.4 riz /* falls thru */
645 1.14.2.4 riz default:
646 1.14.2.4 riz break;
647 1.1 dyoung }
648 1.1 dyoung
649 1.1 dyoung /* Detect and set physical type */
650 1.1 dyoung ixgbe_setup_optics(adapter);
651 1.1 dyoung
652 1.1 dyoung if ((adapter->msix > 1) && (ixgbe_enable_msix))
653 1.1 dyoung error = ixgbe_allocate_msix(adapter, pa);
654 1.1 dyoung else
655 1.1 dyoung error = ixgbe_allocate_legacy(adapter, pa);
656 1.1 dyoung if (error)
657 1.1 dyoung goto err_late;
658 1.1 dyoung
659 1.1 dyoung /* Setup OS specific network interface */
660 1.1 dyoung if (ixgbe_setup_interface(dev, adapter) != 0)
661 1.1 dyoung goto err_late;
662 1.1 dyoung
663 1.1 dyoung /* Initialize statistics */
664 1.1 dyoung ixgbe_update_stats_counters(adapter);
665 1.1 dyoung
666 1.14.2.6 snj /*
667 1.14.2.6 snj ** Check PCIE slot type/speed/width
668 1.14.2.6 snj */
669 1.14.2.6 snj ixgbe_get_slot_info(hw);
670 1.1 dyoung
671 1.14.2.5 riz /* Set an initial default flow control value */
672 1.14.2.5 riz adapter->fc = ixgbe_fc_full;
673 1.14.2.5 riz
674 1.1 dyoung /* let hardware know driver is loaded */
675 1.1 dyoung ctrl_ext = IXGBE_READ_REG(hw, IXGBE_CTRL_EXT);
676 1.1 dyoung ctrl_ext |= IXGBE_CTRL_EXT_DRV_LOAD;
677 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_CTRL_EXT, ctrl_ext);
678 1.1 dyoung
679 1.1 dyoung ixgbe_add_hw_stats(adapter);
680 1.1 dyoung
681 1.14.2.3 martin #ifdef DEV_NETMAP
682 1.14.2.3 martin ixgbe_netmap_attach(adapter);
683 1.14.2.3 martin #endif /* DEV_NETMAP */
684 1.1 dyoung INIT_DEBUGOUT("ixgbe_attach: end");
685 1.14.2.6 snj adapter->osdep.attached = true;
686 1.1 dyoung return;
687 1.1 dyoung err_late:
688 1.1 dyoung ixgbe_free_transmit_structures(adapter);
689 1.1 dyoung ixgbe_free_receive_structures(adapter);
690 1.1 dyoung err_out:
691 1.1 dyoung if (adapter->ifp != NULL)
692 1.1 dyoung if_free(adapter->ifp);
693 1.1 dyoung ixgbe_free_pci_resources(adapter);
694 1.1 dyoung if (adapter->mta != NULL)
695 1.1 dyoung free(adapter->mta, M_DEVBUF);
696 1.1 dyoung return;
697 1.1 dyoung
698 1.1 dyoung }
699 1.1 dyoung
700 1.1 dyoung /*********************************************************************
701 1.1 dyoung * Device removal routine
702 1.1 dyoung *
703 1.1 dyoung * The detach entry point is called when the driver is being removed.
704 1.1 dyoung * This routine stops the adapter and deallocates all the resources
705 1.1 dyoung * that were allocated for driver operation.
706 1.1 dyoung *
707 1.1 dyoung * return 0 on success, positive on failure
708 1.1 dyoung *********************************************************************/
709 1.1 dyoung
710 1.1 dyoung static int
711 1.1 dyoung ixgbe_detach(device_t dev, int flags)
712 1.1 dyoung {
713 1.1 dyoung struct adapter *adapter = device_private(dev);
714 1.1 dyoung struct rx_ring *rxr = adapter->rx_rings;
715 1.1 dyoung struct ixgbe_hw_stats *stats = &adapter->stats;
716 1.1 dyoung struct ix_queue *que = adapter->queues;
717 1.14.2.4 riz struct tx_ring *txr = adapter->tx_rings;
718 1.1 dyoung u32 ctrl_ext;
719 1.1 dyoung
720 1.1 dyoung INIT_DEBUGOUT("ixgbe_detach: begin");
721 1.14.2.6 snj if (adapter->osdep.attached == false)
722 1.14.2.6 snj return 0;
723 1.1 dyoung
724 1.14.2.5 riz #if NVLAN > 0
725 1.1 dyoung /* Make sure VLANs are not using driver */
726 1.1 dyoung if (!VLAN_ATTACHED(&adapter->osdep.ec))
727 1.1 dyoung ; /* nothing to do: no VLANs */
728 1.1 dyoung else if ((flags & (DETACH_SHUTDOWN|DETACH_FORCE)) != 0)
729 1.1 dyoung vlan_ifdetach(adapter->ifp);
730 1.1 dyoung else {
731 1.1 dyoung aprint_error_dev(dev, "VLANs in use\n");
732 1.1 dyoung return EBUSY;
733 1.1 dyoung }
734 1.14.2.5 riz #endif
735 1.1 dyoung
736 1.1 dyoung IXGBE_CORE_LOCK(adapter);
737 1.1 dyoung ixgbe_stop(adapter);
738 1.1 dyoung IXGBE_CORE_UNLOCK(adapter);
739 1.1 dyoung
740 1.14.2.4 riz for (int i = 0; i < adapter->num_queues; i++, que++, txr++) {
741 1.14.2.5 riz #ifndef IXGBE_LEGACY_TX
742 1.14.2.4 riz softint_disestablish(txr->txq_si);
743 1.14.2.4 riz #endif
744 1.1 dyoung softint_disestablish(que->que_si);
745 1.1 dyoung }
746 1.1 dyoung
747 1.1 dyoung /* Drain the Link queue */
748 1.1 dyoung softint_disestablish(adapter->link_si);
749 1.1 dyoung softint_disestablish(adapter->mod_si);
750 1.1 dyoung softint_disestablish(adapter->msf_si);
751 1.1 dyoung #ifdef IXGBE_FDIR
752 1.1 dyoung softint_disestablish(adapter->fdir_si);
753 1.1 dyoung #endif
754 1.1 dyoung
755 1.1 dyoung /* let hardware know driver is unloading */
756 1.1 dyoung ctrl_ext = IXGBE_READ_REG(&adapter->hw, IXGBE_CTRL_EXT);
757 1.1 dyoung ctrl_ext &= ~IXGBE_CTRL_EXT_DRV_LOAD;
758 1.1 dyoung IXGBE_WRITE_REG(&adapter->hw, IXGBE_CTRL_EXT, ctrl_ext);
759 1.1 dyoung
760 1.1 dyoung ether_ifdetach(adapter->ifp);
761 1.1 dyoung callout_halt(&adapter->timer, NULL);
762 1.14.2.3 martin #ifdef DEV_NETMAP
763 1.14.2.3 martin netmap_detach(adapter->ifp);
764 1.14.2.3 martin #endif /* DEV_NETMAP */
765 1.1 dyoung ixgbe_free_pci_resources(adapter);
766 1.1 dyoung #if 0 /* XXX the NetBSD port is probably missing something here */
767 1.1 dyoung bus_generic_detach(dev);
768 1.1 dyoung #endif
769 1.1 dyoung if_detach(adapter->ifp);
770 1.1 dyoung
771 1.1 dyoung sysctl_teardown(&adapter->sysctllog);
772 1.1 dyoung evcnt_detach(&adapter->handleq);
773 1.1 dyoung evcnt_detach(&adapter->req);
774 1.1 dyoung evcnt_detach(&adapter->morerx);
775 1.1 dyoung evcnt_detach(&adapter->moretx);
776 1.1 dyoung evcnt_detach(&adapter->txloops);
777 1.1 dyoung evcnt_detach(&adapter->efbig_tx_dma_setup);
778 1.1 dyoung evcnt_detach(&adapter->m_defrag_failed);
779 1.1 dyoung evcnt_detach(&adapter->efbig2_tx_dma_setup);
780 1.1 dyoung evcnt_detach(&adapter->einval_tx_dma_setup);
781 1.1 dyoung evcnt_detach(&adapter->other_tx_dma_setup);
782 1.1 dyoung evcnt_detach(&adapter->eagain_tx_dma_setup);
783 1.1 dyoung evcnt_detach(&adapter->enomem_tx_dma_setup);
784 1.1 dyoung evcnt_detach(&adapter->watchdog_events);
785 1.1 dyoung evcnt_detach(&adapter->tso_err);
786 1.1 dyoung evcnt_detach(&adapter->link_irq);
787 1.14.2.4 riz
788 1.14.2.4 riz txr = adapter->tx_rings;
789 1.1 dyoung for (int i = 0; i < adapter->num_queues; i++, rxr++, txr++) {
790 1.1 dyoung evcnt_detach(&txr->no_desc_avail);
791 1.1 dyoung evcnt_detach(&txr->total_packets);
792 1.14.2.5 riz evcnt_detach(&txr->tso_tx);
793 1.1 dyoung
794 1.1 dyoung if (i < __arraycount(adapter->stats.mpc)) {
795 1.1 dyoung evcnt_detach(&adapter->stats.mpc[i]);
796 1.1 dyoung }
797 1.1 dyoung if (i < __arraycount(adapter->stats.pxontxc)) {
798 1.1 dyoung evcnt_detach(&adapter->stats.pxontxc[i]);
799 1.1 dyoung evcnt_detach(&adapter->stats.pxonrxc[i]);
800 1.1 dyoung evcnt_detach(&adapter->stats.pxofftxc[i]);
801 1.1 dyoung evcnt_detach(&adapter->stats.pxoffrxc[i]);
802 1.1 dyoung evcnt_detach(&adapter->stats.pxon2offc[i]);
803 1.1 dyoung }
804 1.1 dyoung if (i < __arraycount(adapter->stats.qprc)) {
805 1.1 dyoung evcnt_detach(&adapter->stats.qprc[i]);
806 1.1 dyoung evcnt_detach(&adapter->stats.qptc[i]);
807 1.1 dyoung evcnt_detach(&adapter->stats.qbrc[i]);
808 1.1 dyoung evcnt_detach(&adapter->stats.qbtc[i]);
809 1.1 dyoung evcnt_detach(&adapter->stats.qprdc[i]);
810 1.1 dyoung }
811 1.1 dyoung
812 1.1 dyoung evcnt_detach(&rxr->rx_packets);
813 1.1 dyoung evcnt_detach(&rxr->rx_bytes);
814 1.14.2.6 snj evcnt_detach(&rxr->rx_copies);
815 1.1 dyoung evcnt_detach(&rxr->no_jmbuf);
816 1.1 dyoung evcnt_detach(&rxr->rx_discarded);
817 1.1 dyoung evcnt_detach(&rxr->rx_irq);
818 1.1 dyoung }
819 1.1 dyoung evcnt_detach(&stats->ipcs);
820 1.1 dyoung evcnt_detach(&stats->l4cs);
821 1.1 dyoung evcnt_detach(&stats->ipcs_bad);
822 1.1 dyoung evcnt_detach(&stats->l4cs_bad);
823 1.1 dyoung evcnt_detach(&stats->intzero);
824 1.1 dyoung evcnt_detach(&stats->legint);
825 1.1 dyoung evcnt_detach(&stats->crcerrs);
826 1.1 dyoung evcnt_detach(&stats->illerrc);
827 1.1 dyoung evcnt_detach(&stats->errbc);
828 1.1 dyoung evcnt_detach(&stats->mspdc);
829 1.1 dyoung evcnt_detach(&stats->mlfc);
830 1.1 dyoung evcnt_detach(&stats->mrfc);
831 1.1 dyoung evcnt_detach(&stats->rlec);
832 1.1 dyoung evcnt_detach(&stats->lxontxc);
833 1.1 dyoung evcnt_detach(&stats->lxonrxc);
834 1.1 dyoung evcnt_detach(&stats->lxofftxc);
835 1.1 dyoung evcnt_detach(&stats->lxoffrxc);
836 1.1 dyoung
837 1.1 dyoung /* Packet Reception Stats */
838 1.1 dyoung evcnt_detach(&stats->tor);
839 1.1 dyoung evcnt_detach(&stats->gorc);
840 1.1 dyoung evcnt_detach(&stats->tpr);
841 1.1 dyoung evcnt_detach(&stats->gprc);
842 1.1 dyoung evcnt_detach(&stats->mprc);
843 1.1 dyoung evcnt_detach(&stats->bprc);
844 1.1 dyoung evcnt_detach(&stats->prc64);
845 1.1 dyoung evcnt_detach(&stats->prc127);
846 1.1 dyoung evcnt_detach(&stats->prc255);
847 1.1 dyoung evcnt_detach(&stats->prc511);
848 1.1 dyoung evcnt_detach(&stats->prc1023);
849 1.1 dyoung evcnt_detach(&stats->prc1522);
850 1.1 dyoung evcnt_detach(&stats->ruc);
851 1.1 dyoung evcnt_detach(&stats->rfc);
852 1.1 dyoung evcnt_detach(&stats->roc);
853 1.1 dyoung evcnt_detach(&stats->rjc);
854 1.1 dyoung evcnt_detach(&stats->mngprc);
855 1.1 dyoung evcnt_detach(&stats->xec);
856 1.1 dyoung
857 1.1 dyoung /* Packet Transmission Stats */
858 1.1 dyoung evcnt_detach(&stats->gotc);
859 1.1 dyoung evcnt_detach(&stats->tpt);
860 1.1 dyoung evcnt_detach(&stats->gptc);
861 1.1 dyoung evcnt_detach(&stats->bptc);
862 1.1 dyoung evcnt_detach(&stats->mptc);
863 1.1 dyoung evcnt_detach(&stats->mngptc);
864 1.1 dyoung evcnt_detach(&stats->ptc64);
865 1.1 dyoung evcnt_detach(&stats->ptc127);
866 1.1 dyoung evcnt_detach(&stats->ptc255);
867 1.1 dyoung evcnt_detach(&stats->ptc511);
868 1.1 dyoung evcnt_detach(&stats->ptc1023);
869 1.1 dyoung evcnt_detach(&stats->ptc1522);
870 1.1 dyoung
871 1.1 dyoung ixgbe_free_transmit_structures(adapter);
872 1.1 dyoung ixgbe_free_receive_structures(adapter);
873 1.1 dyoung free(adapter->mta, M_DEVBUF);
874 1.1 dyoung
875 1.1 dyoung IXGBE_CORE_LOCK_DESTROY(adapter);
876 1.1 dyoung return (0);
877 1.1 dyoung }
878 1.1 dyoung
879 1.1 dyoung /*********************************************************************
880 1.1 dyoung *
881 1.1 dyoung * Shutdown entry point
882 1.1 dyoung *
883 1.1 dyoung **********************************************************************/
884 1.1 dyoung
885 1.1 dyoung #if 0 /* XXX NetBSD ought to register something like this through pmf(9) */
886 1.1 dyoung static int
887 1.1 dyoung ixgbe_shutdown(device_t dev)
888 1.1 dyoung {
889 1.1 dyoung struct adapter *adapter = device_private(dev);
890 1.1 dyoung IXGBE_CORE_LOCK(adapter);
891 1.1 dyoung ixgbe_stop(adapter);
892 1.1 dyoung IXGBE_CORE_UNLOCK(adapter);
893 1.1 dyoung return (0);
894 1.1 dyoung }
895 1.1 dyoung #endif
896 1.1 dyoung
897 1.1 dyoung
898 1.14.2.5 riz #ifdef IXGBE_LEGACY_TX
899 1.1 dyoung /*********************************************************************
900 1.1 dyoung * Transmit entry point
901 1.1 dyoung *
902 1.1 dyoung * ixgbe_start is called by the stack to initiate a transmit.
903 1.1 dyoung * The driver will remain in this routine as long as there are
904 1.1 dyoung * packets to transmit and transmit resources are available.
905 1.1 dyoung * In case resources are not available stack is notified and
906 1.1 dyoung * the packet is requeued.
907 1.1 dyoung **********************************************************************/
908 1.1 dyoung
909 1.1 dyoung static void
910 1.1 dyoung ixgbe_start_locked(struct tx_ring *txr, struct ifnet * ifp)
911 1.1 dyoung {
912 1.1 dyoung int rc;
913 1.1 dyoung struct mbuf *m_head;
914 1.1 dyoung struct adapter *adapter = txr->adapter;
915 1.1 dyoung
916 1.1 dyoung IXGBE_TX_LOCK_ASSERT(txr);
917 1.1 dyoung
918 1.14.2.4 riz if ((ifp->if_flags & IFF_RUNNING) == 0)
919 1.1 dyoung return;
920 1.1 dyoung if (!adapter->link_active)
921 1.1 dyoung return;
922 1.1 dyoung
923 1.1 dyoung while (!IFQ_IS_EMPTY(&ifp->if_snd)) {
924 1.14.2.4 riz if (txr->tx_avail <= IXGBE_QUEUE_MIN_FREE)
925 1.14.2.4 riz break;
926 1.1 dyoung
927 1.1 dyoung IFQ_POLL(&ifp->if_snd, m_head);
928 1.1 dyoung if (m_head == NULL)
929 1.1 dyoung break;
930 1.1 dyoung
931 1.1 dyoung if ((rc = ixgbe_xmit(txr, m_head)) == EAGAIN) {
932 1.1 dyoung break;
933 1.1 dyoung }
934 1.1 dyoung IFQ_DEQUEUE(&ifp->if_snd, m_head);
935 1.1 dyoung if (rc == EFBIG) {
936 1.1 dyoung struct mbuf *mtmp;
937 1.1 dyoung
938 1.14.2.5 riz if ((mtmp = m_defrag(m_head, M_NOWAIT)) != NULL) {
939 1.1 dyoung m_head = mtmp;
940 1.1 dyoung rc = ixgbe_xmit(txr, m_head);
941 1.1 dyoung if (rc != 0)
942 1.1 dyoung adapter->efbig2_tx_dma_setup.ev_count++;
943 1.1 dyoung } else
944 1.1 dyoung adapter->m_defrag_failed.ev_count++;
945 1.1 dyoung }
946 1.1 dyoung if (rc != 0) {
947 1.1 dyoung m_freem(m_head);
948 1.1 dyoung continue;
949 1.1 dyoung }
950 1.1 dyoung
951 1.1 dyoung /* Send a copy of the frame to the BPF listener */
952 1.1 dyoung bpf_mtap(ifp, m_head);
953 1.1 dyoung
954 1.1 dyoung /* Set watchdog on */
955 1.1 dyoung getmicrotime(&txr->watchdog_time);
956 1.1 dyoung txr->queue_status = IXGBE_QUEUE_WORKING;
957 1.1 dyoung
958 1.1 dyoung }
959 1.1 dyoung return;
960 1.1 dyoung }
961 1.1 dyoung
962 1.1 dyoung /*
963 1.1 dyoung * Legacy TX start - called by the stack, this
964 1.1 dyoung * always uses the first tx ring, and should
965 1.1 dyoung * not be used with multiqueue tx enabled.
966 1.1 dyoung */
967 1.1 dyoung static void
968 1.1 dyoung ixgbe_start(struct ifnet *ifp)
969 1.1 dyoung {
970 1.1 dyoung struct adapter *adapter = ifp->if_softc;
971 1.1 dyoung struct tx_ring *txr = adapter->tx_rings;
972 1.1 dyoung
973 1.1 dyoung if (ifp->if_flags & IFF_RUNNING) {
974 1.1 dyoung IXGBE_TX_LOCK(txr);
975 1.1 dyoung ixgbe_start_locked(txr, ifp);
976 1.1 dyoung IXGBE_TX_UNLOCK(txr);
977 1.1 dyoung }
978 1.1 dyoung return;
979 1.1 dyoung }
980 1.1 dyoung
981 1.14.2.5 riz #else /* ! IXGBE_LEGACY_TX */
982 1.14.2.5 riz
983 1.1 dyoung /*
984 1.1 dyoung ** Multiqueue Transmit driver
985 1.1 dyoung **
986 1.1 dyoung */
987 1.1 dyoung static int
988 1.1 dyoung ixgbe_mq_start(struct ifnet *ifp, struct mbuf *m)
989 1.1 dyoung {
990 1.1 dyoung struct adapter *adapter = ifp->if_softc;
991 1.1 dyoung struct ix_queue *que;
992 1.1 dyoung struct tx_ring *txr;
993 1.14.2.6 snj int i, err = 0;
994 1.14.2.6 snj #ifdef RSS
995 1.14.2.6 snj uint32_t bucket_id;
996 1.14.2.6 snj #endif
997 1.1 dyoung
998 1.1 dyoung /* Which queue to use */
999 1.14.2.6 snj /*
1000 1.14.2.6 snj * When doing RSS, map it to the same outbound queue
1001 1.14.2.6 snj * as the incoming flow would be mapped to.
1002 1.14.2.6 snj *
1003 1.14.2.6 snj * If everything is setup correctly, it should be the
1004 1.14.2.6 snj * same bucket that the current CPU we're on is.
1005 1.14.2.6 snj */
1006 1.14.2.6 snj if (M_HASHTYPE_GET(m) != M_HASHTYPE_NONE) {
1007 1.14.2.6 snj #ifdef RSS
1008 1.14.2.6 snj if (rss_hash2bucket(m->m_pkthdr.flowid,
1009 1.14.2.6 snj M_HASHTYPE_GET(m), &bucket_id) == 0) {
1010 1.14.2.6 snj /* XXX TODO: spit out something if bucket_id > num_queues? */
1011 1.14.2.6 snj i = bucket_id % adapter->num_queues;
1012 1.14.2.6 snj } else {
1013 1.14.2.6 snj #endif
1014 1.14.2.6 snj i = m->m_pkthdr.flowid % adapter->num_queues;
1015 1.14.2.6 snj #ifdef RSS
1016 1.14.2.6 snj }
1017 1.14.2.6 snj #endif
1018 1.14.2.6 snj } else {
1019 1.14.2.6 snj i = curcpu % adapter->num_queues;
1020 1.14.2.6 snj }
1021 1.1 dyoung
1022 1.1 dyoung txr = &adapter->tx_rings[i];
1023 1.1 dyoung que = &adapter->queues[i];
1024 1.1 dyoung
1025 1.14.2.6 snj err = drbr_enqueue(ifp, txr->br, m);
1026 1.14.2.6 snj if (err)
1027 1.14.2.6 snj return (err);
1028 1.1 dyoung if (IXGBE_TX_TRYLOCK(txr)) {
1029 1.14.2.6 snj ixgbe_mq_start_locked(ifp, txr);
1030 1.1 dyoung IXGBE_TX_UNLOCK(txr);
1031 1.14.2.6 snj } else
1032 1.14.2.4 riz softint_schedule(txr->txq_si);
1033 1.1 dyoung
1034 1.14.2.6 snj return (0);
1035 1.1 dyoung }
1036 1.1 dyoung
1037 1.1 dyoung static int
1038 1.14.2.6 snj ixgbe_mq_start_locked(struct ifnet *ifp, struct tx_ring *txr)
1039 1.1 dyoung {
1040 1.1 dyoung struct adapter *adapter = txr->adapter;
1041 1.14.2.6 snj struct mbuf *next;
1042 1.14.2.6 snj int enqueued = 0, err = 0;
1043 1.1 dyoung
1044 1.14.2.4 riz if (((ifp->if_flags & IFF_RUNNING) == 0) ||
1045 1.14.2.6 snj adapter->link_active == 0)
1046 1.14.2.6 snj return (ENETDOWN);
1047 1.1 dyoung
1048 1.1 dyoung /* Process the queue */
1049 1.14.2.6 snj #if __FreeBSD_version < 901504
1050 1.14.2.6 snj next = drbr_dequeue(ifp, txr->br);
1051 1.14.2.6 snj while (next != NULL) {
1052 1.14.2.6 snj if ((err = ixgbe_xmit(txr, &next)) != 0) {
1053 1.14.2.6 snj if (next != NULL)
1054 1.14.2.6 snj err = drbr_enqueue(ifp, txr->br, next);
1055 1.14.2.6 snj #else
1056 1.14.2.5 riz while ((next = drbr_peek(ifp, txr->br)) != NULL) {
1057 1.1 dyoung if ((err = ixgbe_xmit(txr, &next)) != 0) {
1058 1.14.2.5 riz if (next == NULL) {
1059 1.14.2.5 riz drbr_advance(ifp, txr->br);
1060 1.14.2.5 riz } else {
1061 1.14.2.5 riz drbr_putback(ifp, txr->br, next);
1062 1.14.2.5 riz }
1063 1.14.2.6 snj #endif
1064 1.1 dyoung break;
1065 1.1 dyoung }
1066 1.14.2.6 snj #if __FreeBSD_version >= 901504
1067 1.14.2.5 riz drbr_advance(ifp, txr->br);
1068 1.14.2.6 snj #endif
1069 1.1 dyoung enqueued++;
1070 1.1 dyoung /* Send a copy of the frame to the BPF listener */
1071 1.1 dyoung bpf_mtap(ifp, next);
1072 1.1 dyoung if ((ifp->if_flags & IFF_RUNNING) == 0)
1073 1.1 dyoung break;
1074 1.14.2.6 snj #if __FreeBSD_version < 901504
1075 1.14.2.6 snj next = drbr_dequeue(ifp, txr->br);
1076 1.14.2.6 snj #endif
1077 1.1 dyoung }
1078 1.1 dyoung
1079 1.1 dyoung if (enqueued > 0) {
1080 1.1 dyoung /* Set watchdog on */
1081 1.1 dyoung txr->queue_status = IXGBE_QUEUE_WORKING;
1082 1.1 dyoung getmicrotime(&txr->watchdog_time);
1083 1.1 dyoung }
1084 1.1 dyoung
1085 1.14.2.4 riz if (txr->tx_avail < IXGBE_TX_CLEANUP_THRESHOLD)
1086 1.14.2.4 riz ixgbe_txeof(txr);
1087 1.14.2.4 riz
1088 1.1 dyoung return (err);
1089 1.1 dyoung }
1090 1.1 dyoung
1091 1.1 dyoung /*
1092 1.14.2.4 riz * Called from a taskqueue to drain queued transmit packets.
1093 1.14.2.4 riz */
1094 1.14.2.4 riz static void
1095 1.14.2.6 snj ixgbe_deferred_mq_start(void *arg, int pending)
1096 1.14.2.4 riz {
1097 1.14.2.4 riz struct tx_ring *txr = arg;
1098 1.14.2.4 riz struct adapter *adapter = txr->adapter;
1099 1.14.2.4 riz struct ifnet *ifp = adapter->ifp;
1100 1.14.2.4 riz
1101 1.14.2.4 riz IXGBE_TX_LOCK(txr);
1102 1.14.2.4 riz if (!drbr_empty(ifp, txr->br))
1103 1.14.2.6 snj ixgbe_mq_start_locked(ifp, txr);
1104 1.14.2.4 riz IXGBE_TX_UNLOCK(txr);
1105 1.14.2.4 riz }
1106 1.14.2.4 riz
1107 1.14.2.4 riz /*
1108 1.1 dyoung ** Flush all ring buffers
1109 1.1 dyoung */
1110 1.1 dyoung static void
1111 1.1 dyoung ixgbe_qflush(struct ifnet *ifp)
1112 1.1 dyoung {
1113 1.1 dyoung struct adapter *adapter = ifp->if_softc;
1114 1.1 dyoung struct tx_ring *txr = adapter->tx_rings;
1115 1.1 dyoung struct mbuf *m;
1116 1.1 dyoung
1117 1.1 dyoung for (int i = 0; i < adapter->num_queues; i++, txr++) {
1118 1.1 dyoung IXGBE_TX_LOCK(txr);
1119 1.1 dyoung while ((m = buf_ring_dequeue_sc(txr->br)) != NULL)
1120 1.1 dyoung m_freem(m);
1121 1.1 dyoung IXGBE_TX_UNLOCK(txr);
1122 1.1 dyoung }
1123 1.1 dyoung if_qflush(ifp);
1124 1.1 dyoung }
1125 1.14.2.5 riz #endif /* IXGBE_LEGACY_TX */
1126 1.1 dyoung
1127 1.1 dyoung static int
1128 1.1 dyoung ixgbe_ifflags_cb(struct ethercom *ec)
1129 1.1 dyoung {
1130 1.1 dyoung struct ifnet *ifp = &ec->ec_if;
1131 1.1 dyoung struct adapter *adapter = ifp->if_softc;
1132 1.1 dyoung int change = ifp->if_flags ^ adapter->if_flags, rc = 0;
1133 1.1 dyoung
1134 1.1 dyoung IXGBE_CORE_LOCK(adapter);
1135 1.1 dyoung
1136 1.1 dyoung if (change != 0)
1137 1.1 dyoung adapter->if_flags = ifp->if_flags;
1138 1.1 dyoung
1139 1.1 dyoung if ((change & ~(IFF_CANTCHANGE|IFF_DEBUG)) != 0)
1140 1.1 dyoung rc = ENETRESET;
1141 1.1 dyoung else if ((change & (IFF_PROMISC | IFF_ALLMULTI)) != 0)
1142 1.1 dyoung ixgbe_set_promisc(adapter);
1143 1.1 dyoung
1144 1.14.2.3 martin /* Set up VLAN support and filter */
1145 1.14.2.3 martin ixgbe_setup_vlan_hw_support(adapter);
1146 1.14.2.3 martin
1147 1.1 dyoung IXGBE_CORE_UNLOCK(adapter);
1148 1.1 dyoung
1149 1.1 dyoung return rc;
1150 1.1 dyoung }
1151 1.1 dyoung
1152 1.1 dyoung /*********************************************************************
1153 1.1 dyoung * Ioctl entry point
1154 1.1 dyoung *
1155 1.1 dyoung * ixgbe_ioctl is called when the user wants to configure the
1156 1.1 dyoung * interface.
1157 1.1 dyoung *
1158 1.1 dyoung * return 0 on success, positive on failure
1159 1.1 dyoung **********************************************************************/
1160 1.1 dyoung
1161 1.1 dyoung static int
1162 1.1 dyoung ixgbe_ioctl(struct ifnet * ifp, u_long command, void *data)
1163 1.1 dyoung {
1164 1.1 dyoung struct adapter *adapter = ifp->if_softc;
1165 1.14.2.5 riz struct ixgbe_hw *hw = &adapter->hw;
1166 1.1 dyoung struct ifcapreq *ifcr = data;
1167 1.1 dyoung struct ifreq *ifr = data;
1168 1.1 dyoung int error = 0;
1169 1.1 dyoung int l4csum_en;
1170 1.1 dyoung const int l4csum = IFCAP_CSUM_TCPv4_Rx|IFCAP_CSUM_UDPv4_Rx|
1171 1.1 dyoung IFCAP_CSUM_TCPv6_Rx|IFCAP_CSUM_UDPv6_Rx;
1172 1.1 dyoung
1173 1.1 dyoung switch (command) {
1174 1.1 dyoung case SIOCSIFFLAGS:
1175 1.1 dyoung IOCTL_DEBUGOUT("ioctl: SIOCSIFFLAGS (Set Interface Flags)");
1176 1.1 dyoung break;
1177 1.1 dyoung case SIOCADDMULTI:
1178 1.1 dyoung case SIOCDELMULTI:
1179 1.1 dyoung IOCTL_DEBUGOUT("ioctl: SIOC(ADD|DEL)MULTI");
1180 1.1 dyoung break;
1181 1.1 dyoung case SIOCSIFMEDIA:
1182 1.1 dyoung case SIOCGIFMEDIA:
1183 1.1 dyoung IOCTL_DEBUGOUT("ioctl: SIOCxIFMEDIA (Get/Set Interface Media)");
1184 1.1 dyoung break;
1185 1.1 dyoung case SIOCSIFCAP:
1186 1.1 dyoung IOCTL_DEBUGOUT("ioctl: SIOCSIFCAP (Set Capabilities)");
1187 1.1 dyoung break;
1188 1.1 dyoung case SIOCSIFMTU:
1189 1.1 dyoung IOCTL_DEBUGOUT("ioctl: SIOCSIFMTU (Set Interface MTU)");
1190 1.1 dyoung break;
1191 1.1 dyoung default:
1192 1.1 dyoung IOCTL_DEBUGOUT1("ioctl: UNKNOWN (0x%X)\n", (int)command);
1193 1.1 dyoung break;
1194 1.1 dyoung }
1195 1.1 dyoung
1196 1.1 dyoung switch (command) {
1197 1.1 dyoung case SIOCSIFMEDIA:
1198 1.1 dyoung case SIOCGIFMEDIA:
1199 1.1 dyoung return ifmedia_ioctl(ifp, ifr, &adapter->media, command);
1200 1.14.2.5 riz case SIOCGI2C:
1201 1.14.2.5 riz {
1202 1.14.2.5 riz struct ixgbe_i2c_req i2c;
1203 1.14.2.5 riz IOCTL_DEBUGOUT("ioctl: SIOCGI2C (Get I2C Data)");
1204 1.14.2.5 riz error = copyin(ifr->ifr_data, &i2c, sizeof(i2c));
1205 1.14.2.6 snj if (error != 0)
1206 1.14.2.6 snj break;
1207 1.14.2.6 snj if (i2c.dev_addr != 0xA0 && i2c.dev_addr != 0xA2) {
1208 1.14.2.6 snj error = EINVAL;
1209 1.14.2.5 riz break;
1210 1.14.2.6 snj }
1211 1.14.2.6 snj if (i2c.len > sizeof(i2c.data)) {
1212 1.14.2.5 riz error = EINVAL;
1213 1.14.2.5 riz break;
1214 1.14.2.5 riz }
1215 1.14.2.6 snj
1216 1.14.2.5 riz hw->phy.ops.read_i2c_byte(hw, i2c.offset,
1217 1.14.2.5 riz i2c.dev_addr, i2c.data);
1218 1.14.2.5 riz error = copyout(&i2c, ifr->ifr_data, sizeof(i2c));
1219 1.14.2.5 riz break;
1220 1.14.2.5 riz }
1221 1.1 dyoung case SIOCSIFCAP:
1222 1.1 dyoung /* Layer-4 Rx checksum offload has to be turned on and
1223 1.1 dyoung * off as a unit.
1224 1.1 dyoung */
1225 1.1 dyoung l4csum_en = ifcr->ifcr_capenable & l4csum;
1226 1.1 dyoung if (l4csum_en != l4csum && l4csum_en != 0)
1227 1.1 dyoung return EINVAL;
1228 1.1 dyoung /*FALLTHROUGH*/
1229 1.1 dyoung case SIOCADDMULTI:
1230 1.1 dyoung case SIOCDELMULTI:
1231 1.1 dyoung case SIOCSIFFLAGS:
1232 1.1 dyoung case SIOCSIFMTU:
1233 1.1 dyoung default:
1234 1.1 dyoung if ((error = ether_ioctl(ifp, command, data)) != ENETRESET)
1235 1.1 dyoung return error;
1236 1.1 dyoung if ((ifp->if_flags & IFF_RUNNING) == 0)
1237 1.1 dyoung ;
1238 1.1 dyoung else if (command == SIOCSIFCAP || command == SIOCSIFMTU) {
1239 1.1 dyoung IXGBE_CORE_LOCK(adapter);
1240 1.1 dyoung ixgbe_init_locked(adapter);
1241 1.1 dyoung IXGBE_CORE_UNLOCK(adapter);
1242 1.1 dyoung } else if (command == SIOCADDMULTI || command == SIOCDELMULTI) {
1243 1.1 dyoung /*
1244 1.1 dyoung * Multicast list has changed; set the hardware filter
1245 1.1 dyoung * accordingly.
1246 1.1 dyoung */
1247 1.1 dyoung IXGBE_CORE_LOCK(adapter);
1248 1.1 dyoung ixgbe_disable_intr(adapter);
1249 1.1 dyoung ixgbe_set_multi(adapter);
1250 1.1 dyoung ixgbe_enable_intr(adapter);
1251 1.1 dyoung IXGBE_CORE_UNLOCK(adapter);
1252 1.1 dyoung }
1253 1.1 dyoung return 0;
1254 1.1 dyoung }
1255 1.14.2.5 riz
1256 1.14.2.5 riz return error;
1257 1.1 dyoung }
1258 1.1 dyoung
1259 1.1 dyoung /*********************************************************************
1260 1.1 dyoung * Init entry point
1261 1.1 dyoung *
1262 1.1 dyoung * This routine is used in two ways. It is used by the stack as
1263 1.1 dyoung * init entry point in network interface structure. It is also used
1264 1.1 dyoung * by the driver as a hw/sw initialization routine to get to a
1265 1.1 dyoung * consistent state.
1266 1.1 dyoung *
1267 1.1 dyoung * return 0 on success, positive on failure
1268 1.1 dyoung **********************************************************************/
1269 1.1 dyoung #define IXGBE_MHADD_MFS_SHIFT 16
1270 1.1 dyoung
1271 1.1 dyoung static void
1272 1.1 dyoung ixgbe_init_locked(struct adapter *adapter)
1273 1.1 dyoung {
1274 1.1 dyoung struct ifnet *ifp = adapter->ifp;
1275 1.1 dyoung device_t dev = adapter->dev;
1276 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
1277 1.1 dyoung u32 k, txdctl, mhadd, gpie;
1278 1.1 dyoung u32 rxdctl, rxctrl;
1279 1.1 dyoung
1280 1.1 dyoung /* XXX check IFF_UP and IFF_RUNNING, power-saving state! */
1281 1.1 dyoung
1282 1.1 dyoung KASSERT(mutex_owned(&adapter->core_mtx));
1283 1.14.2.6 snj INIT_DEBUGOUT("ixgbe_init_locked: begin");
1284 1.1 dyoung hw->adapter_stopped = FALSE;
1285 1.1 dyoung ixgbe_stop_adapter(hw);
1286 1.1 dyoung callout_stop(&adapter->timer);
1287 1.1 dyoung
1288 1.1 dyoung /* XXX I moved this here from the SIOCSIFMTU case in ixgbe_ioctl(). */
1289 1.1 dyoung adapter->max_frame_size =
1290 1.1 dyoung ifp->if_mtu + ETHER_HDR_LEN + ETHER_CRC_LEN;
1291 1.1 dyoung
1292 1.1 dyoung /* reprogram the RAR[0] in case user changed it. */
1293 1.1 dyoung ixgbe_set_rar(hw, 0, adapter->hw.mac.addr, 0, IXGBE_RAH_AV);
1294 1.1 dyoung
1295 1.1 dyoung /* Get the latest mac address, User can use a LAA */
1296 1.1 dyoung memcpy(hw->mac.addr, CLLADDR(adapter->ifp->if_sadl),
1297 1.1 dyoung IXGBE_ETH_LENGTH_OF_ADDRESS);
1298 1.1 dyoung ixgbe_set_rar(hw, 0, hw->mac.addr, 0, 1);
1299 1.1 dyoung hw->addr_ctrl.rar_used_count = 1;
1300 1.1 dyoung
1301 1.1 dyoung /* Prepare transmit descriptors and buffers */
1302 1.1 dyoung if (ixgbe_setup_transmit_structures(adapter)) {
1303 1.1 dyoung device_printf(dev,"Could not setup transmit structures\n");
1304 1.1 dyoung ixgbe_stop(adapter);
1305 1.1 dyoung return;
1306 1.1 dyoung }
1307 1.1 dyoung
1308 1.1 dyoung ixgbe_init_hw(hw);
1309 1.1 dyoung ixgbe_initialize_transmit_units(adapter);
1310 1.1 dyoung
1311 1.1 dyoung /* Setup Multicast table */
1312 1.1 dyoung ixgbe_set_multi(adapter);
1313 1.1 dyoung
1314 1.1 dyoung /*
1315 1.1 dyoung ** Determine the correct mbuf pool
1316 1.14.2.4 riz ** for doing jumbo frames
1317 1.1 dyoung */
1318 1.1 dyoung if (adapter->max_frame_size <= 2048)
1319 1.1 dyoung adapter->rx_mbuf_sz = MCLBYTES;
1320 1.1 dyoung else if (adapter->max_frame_size <= 4096)
1321 1.1 dyoung adapter->rx_mbuf_sz = MJUMPAGESIZE;
1322 1.1 dyoung else if (adapter->max_frame_size <= 9216)
1323 1.1 dyoung adapter->rx_mbuf_sz = MJUM9BYTES;
1324 1.1 dyoung else
1325 1.1 dyoung adapter->rx_mbuf_sz = MJUM16BYTES;
1326 1.1 dyoung
1327 1.1 dyoung /* Prepare receive descriptors and buffers */
1328 1.1 dyoung if (ixgbe_setup_receive_structures(adapter)) {
1329 1.1 dyoung device_printf(dev,"Could not setup receive structures\n");
1330 1.1 dyoung ixgbe_stop(adapter);
1331 1.1 dyoung return;
1332 1.1 dyoung }
1333 1.1 dyoung
1334 1.1 dyoung /* Configure RX settings */
1335 1.1 dyoung ixgbe_initialize_receive_units(adapter);
1336 1.1 dyoung
1337 1.1 dyoung gpie = IXGBE_READ_REG(&adapter->hw, IXGBE_GPIE);
1338 1.1 dyoung
1339 1.1 dyoung /* Enable Fan Failure Interrupt */
1340 1.1 dyoung gpie |= IXGBE_SDP1_GPIEN;
1341 1.1 dyoung
1342 1.14.2.6 snj /* Add for Module detection */
1343 1.1 dyoung if (hw->mac.type == ixgbe_mac_82599EB)
1344 1.1 dyoung gpie |= IXGBE_SDP2_GPIEN;
1345 1.1 dyoung
1346 1.14.2.4 riz /* Thermal Failure Detection */
1347 1.14.2.4 riz if (hw->mac.type == ixgbe_mac_X540)
1348 1.14.2.4 riz gpie |= IXGBE_SDP0_GPIEN;
1349 1.14.2.4 riz
1350 1.1 dyoung if (adapter->msix > 1) {
1351 1.1 dyoung /* Enable Enhanced MSIX mode */
1352 1.1 dyoung gpie |= IXGBE_GPIE_MSIX_MODE;
1353 1.1 dyoung gpie |= IXGBE_GPIE_EIAME | IXGBE_GPIE_PBA_SUPPORT |
1354 1.1 dyoung IXGBE_GPIE_OCD;
1355 1.1 dyoung }
1356 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_GPIE, gpie);
1357 1.1 dyoung
1358 1.1 dyoung /* Set MTU size */
1359 1.1 dyoung if (ifp->if_mtu > ETHERMTU) {
1360 1.1 dyoung mhadd = IXGBE_READ_REG(hw, IXGBE_MHADD);
1361 1.1 dyoung mhadd &= ~IXGBE_MHADD_MFS_MASK;
1362 1.1 dyoung mhadd |= adapter->max_frame_size << IXGBE_MHADD_MFS_SHIFT;
1363 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_MHADD, mhadd);
1364 1.1 dyoung }
1365 1.1 dyoung
1366 1.1 dyoung /* Now enable all the queues */
1367 1.1 dyoung
1368 1.1 dyoung for (int i = 0; i < adapter->num_queues; i++) {
1369 1.1 dyoung txdctl = IXGBE_READ_REG(hw, IXGBE_TXDCTL(i));
1370 1.1 dyoung txdctl |= IXGBE_TXDCTL_ENABLE;
1371 1.1 dyoung /* Set WTHRESH to 8, burst writeback */
1372 1.1 dyoung txdctl |= (8 << 16);
1373 1.14.2.4 riz /*
1374 1.14.2.4 riz * When the internal queue falls below PTHRESH (32),
1375 1.14.2.4 riz * start prefetching as long as there are at least
1376 1.14.2.4 riz * HTHRESH (1) buffers ready. The values are taken
1377 1.14.2.4 riz * from the Intel linux driver 3.8.21.
1378 1.14.2.4 riz * Prefetching enables tx line rate even with 1 queue.
1379 1.14.2.4 riz */
1380 1.14.2.4 riz txdctl |= (32 << 0) | (1 << 8);
1381 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_TXDCTL(i), txdctl);
1382 1.1 dyoung }
1383 1.1 dyoung
1384 1.1 dyoung for (int i = 0; i < adapter->num_queues; i++) {
1385 1.1 dyoung rxdctl = IXGBE_READ_REG(hw, IXGBE_RXDCTL(i));
1386 1.1 dyoung if (hw->mac.type == ixgbe_mac_82598EB) {
1387 1.1 dyoung /*
1388 1.1 dyoung ** PTHRESH = 21
1389 1.1 dyoung ** HTHRESH = 4
1390 1.1 dyoung ** WTHRESH = 8
1391 1.1 dyoung */
1392 1.1 dyoung rxdctl &= ~0x3FFFFF;
1393 1.1 dyoung rxdctl |= 0x080420;
1394 1.1 dyoung }
1395 1.1 dyoung rxdctl |= IXGBE_RXDCTL_ENABLE;
1396 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_RXDCTL(i), rxdctl);
1397 1.1 dyoung /* XXX I don't trust this loop, and I don't trust the
1398 1.1 dyoung * XXX memory barrier. What is this meant to do? --dyoung
1399 1.1 dyoung */
1400 1.1 dyoung for (k = 0; k < 10; k++) {
1401 1.1 dyoung if (IXGBE_READ_REG(hw, IXGBE_RXDCTL(i)) &
1402 1.1 dyoung IXGBE_RXDCTL_ENABLE)
1403 1.1 dyoung break;
1404 1.1 dyoung else
1405 1.1 dyoung msec_delay(1);
1406 1.1 dyoung }
1407 1.1 dyoung wmb();
1408 1.14.2.3 martin #ifdef DEV_NETMAP
1409 1.14.2.3 martin /*
1410 1.14.2.3 martin * In netmap mode, we must preserve the buffers made
1411 1.14.2.3 martin * available to userspace before the if_init()
1412 1.14.2.3 martin * (this is true by default on the TX side, because
1413 1.14.2.3 martin * init makes all buffers available to userspace).
1414 1.14.2.3 martin *
1415 1.14.2.3 martin * netmap_reset() and the device specific routines
1416 1.14.2.3 martin * (e.g. ixgbe_setup_receive_rings()) map these
1417 1.14.2.3 martin * buffers at the end of the NIC ring, so here we
1418 1.14.2.3 martin * must set the RDT (tail) register to make sure
1419 1.14.2.3 martin * they are not overwritten.
1420 1.14.2.3 martin *
1421 1.14.2.3 martin * In this driver the NIC ring starts at RDH = 0,
1422 1.14.2.3 martin * RDT points to the last slot available for reception (?),
1423 1.14.2.3 martin * so RDT = num_rx_desc - 1 means the whole ring is available.
1424 1.14.2.3 martin */
1425 1.14.2.3 martin if (ifp->if_capenable & IFCAP_NETMAP) {
1426 1.14.2.3 martin struct netmap_adapter *na = NA(adapter->ifp);
1427 1.14.2.3 martin struct netmap_kring *kring = &na->rx_rings[i];
1428 1.14.2.6 snj int t = na->num_rx_desc - 1 - nm_kr_rxspace(kring);
1429 1.14.2.3 martin
1430 1.14.2.3 martin IXGBE_WRITE_REG(hw, IXGBE_RDT(i), t);
1431 1.14.2.3 martin } else
1432 1.14.2.3 martin #endif /* DEV_NETMAP */
1433 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_RDT(i), adapter->num_rx_desc - 1);
1434 1.1 dyoung }
1435 1.1 dyoung
1436 1.1 dyoung /* Enable Receive engine */
1437 1.1 dyoung rxctrl = IXGBE_READ_REG(hw, IXGBE_RXCTRL);
1438 1.1 dyoung if (hw->mac.type == ixgbe_mac_82598EB)
1439 1.1 dyoung rxctrl |= IXGBE_RXCTRL_DMBYPS;
1440 1.1 dyoung rxctrl |= IXGBE_RXCTRL_RXEN;
1441 1.1 dyoung ixgbe_enable_rx_dma(hw, rxctrl);
1442 1.1 dyoung
1443 1.1 dyoung callout_reset(&adapter->timer, hz, ixgbe_local_timer, adapter);
1444 1.1 dyoung
1445 1.1 dyoung /* Set up MSI/X routing */
1446 1.1 dyoung if (ixgbe_enable_msix) {
1447 1.1 dyoung ixgbe_configure_ivars(adapter);
1448 1.1 dyoung /* Set up auto-mask */
1449 1.1 dyoung if (hw->mac.type == ixgbe_mac_82598EB)
1450 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EIAM, IXGBE_EICS_RTX_QUEUE);
1451 1.1 dyoung else {
1452 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EIAM_EX(0), 0xFFFFFFFF);
1453 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EIAM_EX(1), 0xFFFFFFFF);
1454 1.1 dyoung }
1455 1.1 dyoung } else { /* Simple settings for Legacy/MSI */
1456 1.1 dyoung ixgbe_set_ivar(adapter, 0, 0, 0);
1457 1.1 dyoung ixgbe_set_ivar(adapter, 0, 0, 1);
1458 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EIAM, IXGBE_EICS_RTX_QUEUE);
1459 1.1 dyoung }
1460 1.1 dyoung
1461 1.1 dyoung #ifdef IXGBE_FDIR
1462 1.1 dyoung /* Init Flow director */
1463 1.14.2.4 riz if (hw->mac.type != ixgbe_mac_82598EB) {
1464 1.14.2.4 riz u32 hdrm = 32 << fdir_pballoc;
1465 1.14.2.4 riz
1466 1.14.2.4 riz hw->mac.ops.setup_rxpba(hw, 0, hdrm, PBA_STRATEGY_EQUAL);
1467 1.1 dyoung ixgbe_init_fdir_signature_82599(&adapter->hw, fdir_pballoc);
1468 1.14.2.4 riz }
1469 1.1 dyoung #endif
1470 1.1 dyoung
1471 1.1 dyoung /*
1472 1.1 dyoung ** Check on any SFP devices that
1473 1.1 dyoung ** need to be kick-started
1474 1.1 dyoung */
1475 1.1 dyoung if (hw->phy.type == ixgbe_phy_none) {
1476 1.1 dyoung int err = hw->phy.ops.identify(hw);
1477 1.1 dyoung if (err == IXGBE_ERR_SFP_NOT_SUPPORTED) {
1478 1.1 dyoung device_printf(dev,
1479 1.1 dyoung "Unsupported SFP+ module type was detected.\n");
1480 1.1 dyoung return;
1481 1.1 dyoung }
1482 1.1 dyoung }
1483 1.1 dyoung
1484 1.1 dyoung /* Set moderation on the Link interrupt */
1485 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EITR(adapter->linkvec), IXGBE_LINK_ITR);
1486 1.1 dyoung
1487 1.1 dyoung /* Config/Enable Link */
1488 1.1 dyoung ixgbe_config_link(adapter);
1489 1.1 dyoung
1490 1.14.2.4 riz /* Hardware Packet Buffer & Flow Control setup */
1491 1.14.2.4 riz {
1492 1.14.2.4 riz u32 rxpb, frame, size, tmp;
1493 1.14.2.4 riz
1494 1.14.2.4 riz frame = adapter->max_frame_size;
1495 1.14.2.4 riz
1496 1.14.2.4 riz /* Calculate High Water */
1497 1.14.2.4 riz if (hw->mac.type == ixgbe_mac_X540)
1498 1.14.2.4 riz tmp = IXGBE_DV_X540(frame, frame);
1499 1.14.2.4 riz else
1500 1.14.2.4 riz tmp = IXGBE_DV(frame, frame);
1501 1.14.2.4 riz size = IXGBE_BT2KB(tmp);
1502 1.14.2.4 riz rxpb = IXGBE_READ_REG(hw, IXGBE_RXPBSIZE(0)) >> 10;
1503 1.14.2.4 riz hw->fc.high_water[0] = rxpb - size;
1504 1.14.2.4 riz
1505 1.14.2.4 riz /* Now calculate Low Water */
1506 1.14.2.4 riz if (hw->mac.type == ixgbe_mac_X540)
1507 1.14.2.4 riz tmp = IXGBE_LOW_DV_X540(frame);
1508 1.14.2.4 riz else
1509 1.14.2.4 riz tmp = IXGBE_LOW_DV(frame);
1510 1.14.2.4 riz hw->fc.low_water[0] = IXGBE_BT2KB(tmp);
1511 1.14.2.4 riz
1512 1.14.2.5 riz hw->fc.requested_mode = adapter->fc;
1513 1.14.2.4 riz hw->fc.pause_time = IXGBE_FC_PAUSE;
1514 1.14.2.4 riz hw->fc.send_xon = TRUE;
1515 1.14.2.4 riz }
1516 1.14.2.4 riz /* Initialize the FC settings */
1517 1.14.2.4 riz ixgbe_start_hw(hw);
1518 1.14.2.4 riz
1519 1.14.2.6 snj /* Set up VLAN support and filter */
1520 1.14.2.6 snj ixgbe_setup_vlan_hw_support(adapter);
1521 1.14.2.6 snj
1522 1.1 dyoung /* And now turn on interrupts */
1523 1.1 dyoung ixgbe_enable_intr(adapter);
1524 1.1 dyoung
1525 1.1 dyoung /* Now inform the stack we're ready */
1526 1.1 dyoung ifp->if_flags |= IFF_RUNNING;
1527 1.1 dyoung
1528 1.1 dyoung return;
1529 1.1 dyoung }
1530 1.1 dyoung
1531 1.1 dyoung static int
1532 1.1 dyoung ixgbe_init(struct ifnet *ifp)
1533 1.1 dyoung {
1534 1.1 dyoung struct adapter *adapter = ifp->if_softc;
1535 1.1 dyoung
1536 1.1 dyoung IXGBE_CORE_LOCK(adapter);
1537 1.1 dyoung ixgbe_init_locked(adapter);
1538 1.1 dyoung IXGBE_CORE_UNLOCK(adapter);
1539 1.1 dyoung return 0; /* XXX ixgbe_init_locked cannot fail? really? */
1540 1.1 dyoung }
1541 1.1 dyoung
1542 1.1 dyoung
1543 1.1 dyoung /*
1544 1.1 dyoung **
1545 1.1 dyoung ** MSIX Interrupt Handlers and Tasklets
1546 1.1 dyoung **
1547 1.1 dyoung */
1548 1.1 dyoung
1549 1.1 dyoung static inline void
1550 1.1 dyoung ixgbe_enable_queue(struct adapter *adapter, u32 vector)
1551 1.1 dyoung {
1552 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
1553 1.13 christos u64 queue = (u64)(1ULL << vector);
1554 1.1 dyoung u32 mask;
1555 1.1 dyoung
1556 1.1 dyoung if (hw->mac.type == ixgbe_mac_82598EB) {
1557 1.1 dyoung mask = (IXGBE_EIMS_RTX_QUEUE & queue);
1558 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EIMS, mask);
1559 1.1 dyoung } else {
1560 1.1 dyoung mask = (queue & 0xFFFFFFFF);
1561 1.1 dyoung if (mask)
1562 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EIMS_EX(0), mask);
1563 1.1 dyoung mask = (queue >> 32);
1564 1.1 dyoung if (mask)
1565 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EIMS_EX(1), mask);
1566 1.1 dyoung }
1567 1.1 dyoung }
1568 1.1 dyoung
1569 1.11 joerg __unused static inline void
1570 1.1 dyoung ixgbe_disable_queue(struct adapter *adapter, u32 vector)
1571 1.1 dyoung {
1572 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
1573 1.13 christos u64 queue = (u64)(1ULL << vector);
1574 1.1 dyoung u32 mask;
1575 1.1 dyoung
1576 1.1 dyoung if (hw->mac.type == ixgbe_mac_82598EB) {
1577 1.1 dyoung mask = (IXGBE_EIMS_RTX_QUEUE & queue);
1578 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EIMC, mask);
1579 1.1 dyoung } else {
1580 1.1 dyoung mask = (queue & 0xFFFFFFFF);
1581 1.1 dyoung if (mask)
1582 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EIMC_EX(0), mask);
1583 1.1 dyoung mask = (queue >> 32);
1584 1.1 dyoung if (mask)
1585 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EIMC_EX(1), mask);
1586 1.1 dyoung }
1587 1.1 dyoung }
1588 1.1 dyoung
1589 1.1 dyoung static void
1590 1.1 dyoung ixgbe_handle_que(void *context)
1591 1.1 dyoung {
1592 1.1 dyoung struct ix_queue *que = context;
1593 1.1 dyoung struct adapter *adapter = que->adapter;
1594 1.1 dyoung struct tx_ring *txr = que->txr;
1595 1.1 dyoung struct ifnet *ifp = adapter->ifp;
1596 1.1 dyoung
1597 1.1 dyoung adapter->handleq.ev_count++;
1598 1.1 dyoung
1599 1.1 dyoung if (ifp->if_flags & IFF_RUNNING) {
1600 1.14.2.6 snj ixgbe_rxeof(que);
1601 1.1 dyoung IXGBE_TX_LOCK(txr);
1602 1.1 dyoung ixgbe_txeof(txr);
1603 1.14.2.5 riz #ifndef IXGBE_LEGACY_TX
1604 1.1 dyoung if (!drbr_empty(ifp, txr->br))
1605 1.14.2.6 snj ixgbe_mq_start_locked(ifp, txr);
1606 1.1 dyoung #else
1607 1.1 dyoung if (!IFQ_IS_EMPTY(&ifp->if_snd))
1608 1.1 dyoung ixgbe_start_locked(txr, ifp);
1609 1.1 dyoung #endif
1610 1.1 dyoung IXGBE_TX_UNLOCK(txr);
1611 1.1 dyoung }
1612 1.1 dyoung
1613 1.1 dyoung /* Reenable this interrupt */
1614 1.14.2.6 snj if (que->res != NULL)
1615 1.14.2.6 snj ixgbe_enable_queue(adapter, que->msix);
1616 1.14.2.6 snj else
1617 1.14.2.6 snj ixgbe_enable_intr(adapter);
1618 1.1 dyoung return;
1619 1.1 dyoung }
1620 1.1 dyoung
1621 1.1 dyoung
1622 1.1 dyoung /*********************************************************************
1623 1.1 dyoung *
1624 1.1 dyoung * Legacy Interrupt Service routine
1625 1.1 dyoung *
1626 1.1 dyoung **********************************************************************/
1627 1.1 dyoung
1628 1.1 dyoung static int
1629 1.1 dyoung ixgbe_legacy_irq(void *arg)
1630 1.1 dyoung {
1631 1.1 dyoung struct ix_queue *que = arg;
1632 1.1 dyoung struct adapter *adapter = que->adapter;
1633 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
1634 1.14.2.6 snj struct ifnet *ifp = adapter->ifp;
1635 1.1 dyoung struct tx_ring *txr = adapter->tx_rings;
1636 1.14.2.6 snj bool more = false;
1637 1.14.2.6 snj u32 reg_eicr;
1638 1.14.2.6 snj
1639 1.1 dyoung
1640 1.1 dyoung reg_eicr = IXGBE_READ_REG(hw, IXGBE_EICR);
1641 1.1 dyoung
1642 1.1 dyoung adapter->stats.legint.ev_count++;
1643 1.1 dyoung ++que->irqs;
1644 1.1 dyoung if (reg_eicr == 0) {
1645 1.1 dyoung adapter->stats.intzero.ev_count++;
1646 1.14.2.1 martin if ((ifp->if_flags & IFF_UP) != 0)
1647 1.14.2.1 martin ixgbe_enable_intr(adapter);
1648 1.1 dyoung return 0;
1649 1.1 dyoung }
1650 1.1 dyoung
1651 1.14.2.1 martin if ((ifp->if_flags & IFF_RUNNING) != 0) {
1652 1.14.2.6 snj more = ixgbe_rxeof(que);
1653 1.1 dyoung
1654 1.14.2.1 martin IXGBE_TX_LOCK(txr);
1655 1.14.2.6 snj ixgbe_txeof(txr);
1656 1.14.2.6 snj #ifdef IXGBE_LEGACY_TX
1657 1.14.2.6 snj if (!IFQ_IS_EMPTY(&ifp->if_snd))
1658 1.14.2.6 snj ixgbe_start_locked(txr, ifp);
1659 1.14.2.6 snj #else
1660 1.14.2.6 snj if (!drbr_empty(ifp, txr->br))
1661 1.14.2.6 snj ixgbe_mq_start_locked(ifp, txr);
1662 1.14.2.6 snj #endif
1663 1.14.2.1 martin IXGBE_TX_UNLOCK(txr);
1664 1.14.2.1 martin }
1665 1.1 dyoung
1666 1.1 dyoung /* Check for fan failure */
1667 1.1 dyoung if ((hw->phy.media_type == ixgbe_media_type_copper) &&
1668 1.1 dyoung (reg_eicr & IXGBE_EICR_GPI_SDP1)) {
1669 1.1 dyoung device_printf(adapter->dev, "\nCRITICAL: FAN FAILURE!! "
1670 1.1 dyoung "REPLACE IMMEDIATELY!!\n");
1671 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EIMS, IXGBE_EICR_GPI_SDP1);
1672 1.1 dyoung }
1673 1.1 dyoung
1674 1.1 dyoung /* Link status change */
1675 1.1 dyoung if (reg_eicr & IXGBE_EICR_LSC)
1676 1.1 dyoung softint_schedule(adapter->link_si);
1677 1.1 dyoung
1678 1.14.2.6 snj if (more)
1679 1.14.2.6 snj #ifndef IXGBE_LEGACY_TX
1680 1.14.2.6 snj softint_schedule(txr->txq_si);
1681 1.14.2.6 snj #else
1682 1.14.2.6 snj softint_schedule(que->que_si);
1683 1.14.2.6 snj #endif
1684 1.14.2.6 snj else
1685 1.14.2.6 snj ixgbe_enable_intr(adapter);
1686 1.1 dyoung return 1;
1687 1.1 dyoung }
1688 1.1 dyoung
1689 1.1 dyoung
1690 1.1 dyoung #if defined(NETBSD_MSI_OR_MSIX)
1691 1.1 dyoung /*********************************************************************
1692 1.1 dyoung *
1693 1.14.2.3 martin * MSIX Queue Interrupt Service routine
1694 1.1 dyoung *
1695 1.1 dyoung **********************************************************************/
1696 1.1 dyoung void
1697 1.1 dyoung ixgbe_msix_que(void *arg)
1698 1.1 dyoung {
1699 1.1 dyoung struct ix_queue *que = arg;
1700 1.1 dyoung struct adapter *adapter = que->adapter;
1701 1.14.2.6 snj struct ifnet *ifp = adapter->ifp;
1702 1.1 dyoung struct tx_ring *txr = que->txr;
1703 1.1 dyoung struct rx_ring *rxr = que->rxr;
1704 1.14.2.6 snj bool more;
1705 1.1 dyoung u32 newitr = 0;
1706 1.1 dyoung
1707 1.14.2.6 snj /* Protect against spurious interrupts */
1708 1.14.2.6 snj if ((ifp->if_flags & IFF_RUNNING) == 0)
1709 1.14.2.6 snj return;
1710 1.14.2.6 snj
1711 1.14.2.4 riz ixgbe_disable_queue(adapter, que->msix);
1712 1.1 dyoung ++que->irqs;
1713 1.1 dyoung
1714 1.14.2.6 snj more = ixgbe_rxeof(que);
1715 1.1 dyoung
1716 1.1 dyoung IXGBE_TX_LOCK(txr);
1717 1.14.2.6 snj ixgbe_txeof(txr);
1718 1.14.2.5 riz #ifdef IXGBE_LEGACY_TX
1719 1.14.2.4 riz if (!IFQ_IS_EMPTY(&adapter->ifp->if_snd))
1720 1.14.2.3 martin #else
1721 1.14.2.6 snj if (!drbr_empty(ifp, txr->br))
1722 1.14.2.6 snj ixgbe_mq_start_locked(ifp, txr);
1723 1.14.2.3 martin #endif
1724 1.1 dyoung IXGBE_TX_UNLOCK(txr);
1725 1.1 dyoung
1726 1.1 dyoung /* Do AIM now? */
1727 1.1 dyoung
1728 1.1 dyoung if (ixgbe_enable_aim == FALSE)
1729 1.1 dyoung goto no_calc;
1730 1.1 dyoung /*
1731 1.1 dyoung ** Do Adaptive Interrupt Moderation:
1732 1.1 dyoung ** - Write out last calculated setting
1733 1.1 dyoung ** - Calculate based on average size over
1734 1.1 dyoung ** the last interval.
1735 1.1 dyoung */
1736 1.1 dyoung if (que->eitr_setting)
1737 1.1 dyoung IXGBE_WRITE_REG(&adapter->hw,
1738 1.1 dyoung IXGBE_EITR(que->msix), que->eitr_setting);
1739 1.1 dyoung
1740 1.1 dyoung que->eitr_setting = 0;
1741 1.1 dyoung
1742 1.1 dyoung /* Idle, do nothing */
1743 1.1 dyoung if ((txr->bytes == 0) && (rxr->bytes == 0))
1744 1.1 dyoung goto no_calc;
1745 1.1 dyoung
1746 1.1 dyoung if ((txr->bytes) && (txr->packets))
1747 1.1 dyoung newitr = txr->bytes/txr->packets;
1748 1.1 dyoung if ((rxr->bytes) && (rxr->packets))
1749 1.1 dyoung newitr = max(newitr,
1750 1.1 dyoung (rxr->bytes / rxr->packets));
1751 1.1 dyoung newitr += 24; /* account for hardware frame, crc */
1752 1.1 dyoung
1753 1.1 dyoung /* set an upper boundary */
1754 1.1 dyoung newitr = min(newitr, 3000);
1755 1.1 dyoung
1756 1.1 dyoung /* Be nice to the mid range */
1757 1.1 dyoung if ((newitr > 300) && (newitr < 1200))
1758 1.1 dyoung newitr = (newitr / 3);
1759 1.1 dyoung else
1760 1.1 dyoung newitr = (newitr / 2);
1761 1.1 dyoung
1762 1.1 dyoung if (adapter->hw.mac.type == ixgbe_mac_82598EB)
1763 1.1 dyoung newitr |= newitr << 16;
1764 1.1 dyoung else
1765 1.1 dyoung newitr |= IXGBE_EITR_CNT_WDIS;
1766 1.1 dyoung
1767 1.1 dyoung /* save for next interrupt */
1768 1.1 dyoung que->eitr_setting = newitr;
1769 1.1 dyoung
1770 1.1 dyoung /* Reset state */
1771 1.1 dyoung txr->bytes = 0;
1772 1.1 dyoung txr->packets = 0;
1773 1.1 dyoung rxr->bytes = 0;
1774 1.1 dyoung rxr->packets = 0;
1775 1.1 dyoung
1776 1.1 dyoung no_calc:
1777 1.14.2.6 snj if (more)
1778 1.1 dyoung softint_schedule(que->que_si);
1779 1.14.2.6 snj else
1780 1.1 dyoung ixgbe_enable_queue(adapter, que->msix);
1781 1.1 dyoung return;
1782 1.1 dyoung }
1783 1.1 dyoung
1784 1.1 dyoung
1785 1.1 dyoung static void
1786 1.1 dyoung ixgbe_msix_link(void *arg)
1787 1.1 dyoung {
1788 1.1 dyoung struct adapter *adapter = arg;
1789 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
1790 1.1 dyoung u32 reg_eicr;
1791 1.1 dyoung
1792 1.1 dyoung ++adapter->link_irq.ev_count;
1793 1.1 dyoung
1794 1.1 dyoung /* First get the cause */
1795 1.1 dyoung reg_eicr = IXGBE_READ_REG(hw, IXGBE_EICS);
1796 1.14.2.6 snj /* Be sure the queue bits are not cleared */
1797 1.14.2.6 snj reg_eicr &= ~IXGBE_EICR_RTX_QUEUE;
1798 1.1 dyoung /* Clear interrupt with write */
1799 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EICR, reg_eicr);
1800 1.1 dyoung
1801 1.1 dyoung /* Link status change */
1802 1.1 dyoung if (reg_eicr & IXGBE_EICR_LSC)
1803 1.1 dyoung softint_schedule(adapter->link_si);
1804 1.1 dyoung
1805 1.1 dyoung if (adapter->hw.mac.type != ixgbe_mac_82598EB) {
1806 1.1 dyoung #ifdef IXGBE_FDIR
1807 1.1 dyoung if (reg_eicr & IXGBE_EICR_FLOW_DIR) {
1808 1.1 dyoung /* This is probably overkill :) */
1809 1.1 dyoung if (!atomic_cmpset_int(&adapter->fdir_reinit, 0, 1))
1810 1.1 dyoung return;
1811 1.14.2.4 riz /* Disable the interrupt */
1812 1.14.2.4 riz IXGBE_WRITE_REG(hw, IXGBE_EIMC, IXGBE_EICR_FLOW_DIR);
1813 1.1 dyoung softint_schedule(adapter->fdir_si);
1814 1.1 dyoung } else
1815 1.1 dyoung #endif
1816 1.1 dyoung if (reg_eicr & IXGBE_EICR_ECC) {
1817 1.1 dyoung device_printf(adapter->dev, "\nCRITICAL: ECC ERROR!! "
1818 1.1 dyoung "Please Reboot!!\n");
1819 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EICR, IXGBE_EICR_ECC);
1820 1.1 dyoung } else
1821 1.1 dyoung
1822 1.1 dyoung if (reg_eicr & IXGBE_EICR_GPI_SDP1) {
1823 1.1 dyoung /* Clear the interrupt */
1824 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EICR, IXGBE_EICR_GPI_SDP1);
1825 1.1 dyoung softint_schedule(adapter->msf_si);
1826 1.1 dyoung } else if (reg_eicr & IXGBE_EICR_GPI_SDP2) {
1827 1.1 dyoung /* Clear the interrupt */
1828 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EICR, IXGBE_EICR_GPI_SDP2);
1829 1.1 dyoung softint_schedule(adapter->mod_si);
1830 1.1 dyoung }
1831 1.1 dyoung }
1832 1.1 dyoung
1833 1.1 dyoung /* Check for fan failure */
1834 1.1 dyoung if ((hw->device_id == IXGBE_DEV_ID_82598AT) &&
1835 1.1 dyoung (reg_eicr & IXGBE_EICR_GPI_SDP1)) {
1836 1.1 dyoung device_printf(adapter->dev, "\nCRITICAL: FAN FAILURE!! "
1837 1.1 dyoung "REPLACE IMMEDIATELY!!\n");
1838 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EICR, IXGBE_EICR_GPI_SDP1);
1839 1.1 dyoung }
1840 1.1 dyoung
1841 1.14.2.4 riz /* Check for over temp condition */
1842 1.14.2.4 riz if ((hw->mac.type == ixgbe_mac_X540) &&
1843 1.14.2.5 riz (reg_eicr & IXGBE_EICR_TS)) {
1844 1.14.2.4 riz device_printf(adapter->dev, "\nCRITICAL: OVER TEMP!! "
1845 1.14.2.4 riz "PHY IS SHUT DOWN!!\n");
1846 1.14.2.4 riz device_printf(adapter->dev, "System shutdown required\n");
1847 1.14.2.5 riz IXGBE_WRITE_REG(hw, IXGBE_EICR, IXGBE_EICR_TS);
1848 1.14.2.4 riz }
1849 1.14.2.4 riz
1850 1.1 dyoung IXGBE_WRITE_REG(&adapter->hw, IXGBE_EIMS, IXGBE_EIMS_OTHER);
1851 1.1 dyoung return;
1852 1.1 dyoung }
1853 1.1 dyoung #endif
1854 1.1 dyoung
1855 1.1 dyoung /*********************************************************************
1856 1.1 dyoung *
1857 1.1 dyoung * Media Ioctl callback
1858 1.1 dyoung *
1859 1.1 dyoung * This routine is called whenever the user queries the status of
1860 1.1 dyoung * the interface using ifconfig.
1861 1.1 dyoung *
1862 1.1 dyoung **********************************************************************/
1863 1.1 dyoung static void
1864 1.1 dyoung ixgbe_media_status(struct ifnet * ifp, struct ifmediareq * ifmr)
1865 1.1 dyoung {
1866 1.1 dyoung struct adapter *adapter = ifp->if_softc;
1867 1.14.2.6 snj struct ixgbe_hw *hw = &adapter->hw;
1868 1.1 dyoung
1869 1.1 dyoung INIT_DEBUGOUT("ixgbe_media_status: begin");
1870 1.1 dyoung IXGBE_CORE_LOCK(adapter);
1871 1.1 dyoung ixgbe_update_link_status(adapter);
1872 1.1 dyoung
1873 1.1 dyoung ifmr->ifm_status = IFM_AVALID;
1874 1.1 dyoung ifmr->ifm_active = IFM_ETHER;
1875 1.1 dyoung
1876 1.1 dyoung if (!adapter->link_active) {
1877 1.1 dyoung IXGBE_CORE_UNLOCK(adapter);
1878 1.1 dyoung return;
1879 1.1 dyoung }
1880 1.1 dyoung
1881 1.1 dyoung ifmr->ifm_status |= IFM_ACTIVE;
1882 1.1 dyoung
1883 1.14.2.6 snj /*
1884 1.14.2.6 snj * Not all NIC are 1000baseSX as an example X540T.
1885 1.14.2.6 snj * We must set properly the media based on NIC model.
1886 1.14.2.6 snj */
1887 1.14.2.6 snj switch (hw->device_id) {
1888 1.14.2.6 snj case IXGBE_DEV_ID_X540T:
1889 1.14.2.6 snj if (adapter->link_speed == IXGBE_LINK_SPEED_100_FULL)
1890 1.14.2.4 riz ifmr->ifm_active |= IFM_100_TX | IFM_FDX;
1891 1.14.2.6 snj else if (adapter->link_speed == IXGBE_LINK_SPEED_1GB_FULL)
1892 1.14.2.6 snj ifmr->ifm_active |= IFM_1000_T | IFM_FDX;
1893 1.14.2.6 snj else if (adapter->link_speed == IXGBE_LINK_SPEED_10GB_FULL)
1894 1.14.2.6 snj ifmr->ifm_active |= adapter->optics | IFM_FDX;
1895 1.14.2.6 snj break;
1896 1.14.2.6 snj default:
1897 1.14.2.6 snj if (adapter->link_speed == IXGBE_LINK_SPEED_100_FULL)
1898 1.14.2.6 snj ifmr->ifm_active |= IFM_100_TX | IFM_FDX;
1899 1.14.2.6 snj else if (adapter->link_speed == IXGBE_LINK_SPEED_1GB_FULL)
1900 1.14.2.5 riz ifmr->ifm_active |= IFM_1000_SX | IFM_FDX;
1901 1.14.2.6 snj else if (adapter->link_speed == IXGBE_LINK_SPEED_10GB_FULL)
1902 1.1 dyoung ifmr->ifm_active |= adapter->optics | IFM_FDX;
1903 1.14.2.6 snj break;
1904 1.1 dyoung }
1905 1.1 dyoung
1906 1.1 dyoung IXGBE_CORE_UNLOCK(adapter);
1907 1.1 dyoung
1908 1.1 dyoung return;
1909 1.1 dyoung }
1910 1.1 dyoung
1911 1.1 dyoung /*********************************************************************
1912 1.1 dyoung *
1913 1.1 dyoung * Media Ioctl callback
1914 1.1 dyoung *
1915 1.1 dyoung * This routine is called when the user changes speed/duplex using
1916 1.1 dyoung * media/mediopt option with ifconfig.
1917 1.1 dyoung *
1918 1.1 dyoung **********************************************************************/
1919 1.1 dyoung static int
1920 1.1 dyoung ixgbe_media_change(struct ifnet * ifp)
1921 1.1 dyoung {
1922 1.1 dyoung struct adapter *adapter = ifp->if_softc;
1923 1.1 dyoung struct ifmedia *ifm = &adapter->media;
1924 1.1 dyoung
1925 1.1 dyoung INIT_DEBUGOUT("ixgbe_media_change: begin");
1926 1.1 dyoung
1927 1.1 dyoung if (IFM_TYPE(ifm->ifm_media) != IFM_ETHER)
1928 1.1 dyoung return (EINVAL);
1929 1.1 dyoung
1930 1.1 dyoung switch (IFM_SUBTYPE(ifm->ifm_media)) {
1931 1.14.2.6 snj case IFM_10G_T:
1932 1.14.2.6 snj case IFM_AUTO:
1933 1.14.2.6 snj adapter->hw.phy.autoneg_advertised =
1934 1.14.2.4 riz IXGBE_LINK_SPEED_100_FULL |
1935 1.14.2.4 riz IXGBE_LINK_SPEED_1GB_FULL |
1936 1.14.2.4 riz IXGBE_LINK_SPEED_10GB_FULL;
1937 1.1 dyoung break;
1938 1.1 dyoung default:
1939 1.1 dyoung device_printf(adapter->dev, "Only auto media type\n");
1940 1.1 dyoung return (EINVAL);
1941 1.1 dyoung }
1942 1.1 dyoung
1943 1.1 dyoung return (0);
1944 1.1 dyoung }
1945 1.1 dyoung
1946 1.1 dyoung /*********************************************************************
1947 1.1 dyoung *
1948 1.1 dyoung * This routine maps the mbufs to tx descriptors, allowing the
1949 1.1 dyoung * TX engine to transmit the packets.
1950 1.1 dyoung * - return 0 on success, positive on failure
1951 1.1 dyoung *
1952 1.1 dyoung **********************************************************************/
1953 1.1 dyoung
1954 1.1 dyoung static int
1955 1.1 dyoung ixgbe_xmit(struct tx_ring *txr, struct mbuf *m_head)
1956 1.1 dyoung {
1957 1.1 dyoung struct m_tag *mtag;
1958 1.1 dyoung struct adapter *adapter = txr->adapter;
1959 1.1 dyoung struct ethercom *ec = &adapter->osdep.ec;
1960 1.1 dyoung u32 olinfo_status = 0, cmd_type_len;
1961 1.1 dyoung int i, j, error;
1962 1.14.2.5 riz int first;
1963 1.1 dyoung bus_dmamap_t map;
1964 1.9 skrll struct ixgbe_tx_buf *txbuf;
1965 1.1 dyoung union ixgbe_adv_tx_desc *txd = NULL;
1966 1.1 dyoung
1967 1.1 dyoung /* Basic descriptor defines */
1968 1.1 dyoung cmd_type_len = (IXGBE_ADVTXD_DTYP_DATA |
1969 1.1 dyoung IXGBE_ADVTXD_DCMD_IFCS | IXGBE_ADVTXD_DCMD_DEXT);
1970 1.1 dyoung
1971 1.1 dyoung if ((mtag = VLAN_OUTPUT_TAG(ec, m_head)) != NULL)
1972 1.1 dyoung cmd_type_len |= IXGBE_ADVTXD_DCMD_VLE;
1973 1.1 dyoung
1974 1.1 dyoung /*
1975 1.1 dyoung * Important to capture the first descriptor
1976 1.1 dyoung * used because it will contain the index of
1977 1.1 dyoung * the one we tell the hardware to report back
1978 1.1 dyoung */
1979 1.1 dyoung first = txr->next_avail_desc;
1980 1.1 dyoung txbuf = &txr->tx_buffers[first];
1981 1.1 dyoung map = txbuf->map;
1982 1.1 dyoung
1983 1.1 dyoung /*
1984 1.1 dyoung * Map the packet for DMA.
1985 1.1 dyoung */
1986 1.1 dyoung error = bus_dmamap_load_mbuf(txr->txtag->dt_dmat, map,
1987 1.1 dyoung m_head, BUS_DMA_NOWAIT);
1988 1.1 dyoung
1989 1.14.2.5 riz if (__predict_false(error)) {
1990 1.14.2.5 riz
1991 1.14.2.5 riz switch (error) {
1992 1.14.2.5 riz case EAGAIN:
1993 1.14.2.5 riz adapter->eagain_tx_dma_setup.ev_count++;
1994 1.14.2.5 riz return EAGAIN;
1995 1.14.2.5 riz case ENOMEM:
1996 1.14.2.5 riz adapter->enomem_tx_dma_setup.ev_count++;
1997 1.14.2.5 riz return EAGAIN;
1998 1.14.2.5 riz case EFBIG:
1999 1.14.2.5 riz /*
2000 1.14.2.5 riz * XXX Try it again?
2001 1.14.2.5 riz * do m_defrag() and retry bus_dmamap_load_mbuf().
2002 1.14.2.5 riz */
2003 1.14.2.5 riz adapter->efbig_tx_dma_setup.ev_count++;
2004 1.14.2.5 riz return error;
2005 1.14.2.5 riz case EINVAL:
2006 1.14.2.5 riz adapter->einval_tx_dma_setup.ev_count++;
2007 1.14.2.5 riz return error;
2008 1.14.2.5 riz default:
2009 1.14.2.5 riz adapter->other_tx_dma_setup.ev_count++;
2010 1.14.2.5 riz return error;
2011 1.14.2.5 riz }
2012 1.1 dyoung }
2013 1.1 dyoung
2014 1.1 dyoung /* Make certain there are enough descriptors */
2015 1.1 dyoung if (map->dm_nsegs > txr->tx_avail - 2) {
2016 1.1 dyoung txr->no_desc_avail.ev_count++;
2017 1.1 dyoung ixgbe_dmamap_unload(txr->txtag, txbuf->map);
2018 1.1 dyoung return EAGAIN;
2019 1.1 dyoung }
2020 1.1 dyoung
2021 1.1 dyoung /*
2022 1.1 dyoung ** Set up the appropriate offload context
2023 1.14.2.5 riz ** this will consume the first descriptor
2024 1.1 dyoung */
2025 1.14.2.5 riz error = ixgbe_tx_ctx_setup(txr, m_head, &cmd_type_len, &olinfo_status);
2026 1.14.2.5 riz if (__predict_false(error)) {
2027 1.14.2.5 riz return (error);
2028 1.14.2.5 riz }
2029 1.1 dyoung
2030 1.1 dyoung #ifdef IXGBE_FDIR
2031 1.1 dyoung /* Do the flow director magic */
2032 1.1 dyoung if ((txr->atr_sample) && (!adapter->fdir_reinit)) {
2033 1.1 dyoung ++txr->atr_count;
2034 1.1 dyoung if (txr->atr_count >= atr_sample_rate) {
2035 1.1 dyoung ixgbe_atr(txr, m_head);
2036 1.1 dyoung txr->atr_count = 0;
2037 1.1 dyoung }
2038 1.1 dyoung }
2039 1.1 dyoung #endif
2040 1.1 dyoung
2041 1.1 dyoung i = txr->next_avail_desc;
2042 1.1 dyoung for (j = 0; j < map->dm_nsegs; j++) {
2043 1.1 dyoung bus_size_t seglen;
2044 1.1 dyoung bus_addr_t segaddr;
2045 1.1 dyoung
2046 1.1 dyoung txbuf = &txr->tx_buffers[i];
2047 1.1 dyoung txd = &txr->tx_base[i];
2048 1.1 dyoung seglen = map->dm_segs[j].ds_len;
2049 1.1 dyoung segaddr = htole64(map->dm_segs[j].ds_addr);
2050 1.1 dyoung
2051 1.1 dyoung txd->read.buffer_addr = segaddr;
2052 1.1 dyoung txd->read.cmd_type_len = htole32(txr->txd_cmd |
2053 1.1 dyoung cmd_type_len |seglen);
2054 1.1 dyoung txd->read.olinfo_status = htole32(olinfo_status);
2055 1.1 dyoung
2056 1.14.2.5 riz if (++i == txr->num_desc)
2057 1.1 dyoung i = 0;
2058 1.1 dyoung }
2059 1.1 dyoung
2060 1.1 dyoung txd->read.cmd_type_len |=
2061 1.1 dyoung htole32(IXGBE_TXD_CMD_EOP | IXGBE_TXD_CMD_RS);
2062 1.1 dyoung txr->tx_avail -= map->dm_nsegs;
2063 1.1 dyoung txr->next_avail_desc = i;
2064 1.1 dyoung
2065 1.1 dyoung txbuf->m_head = m_head;
2066 1.14.2.5 riz /*
2067 1.14.2.5 riz ** Here we swap the map so the last descriptor,
2068 1.14.2.5 riz ** which gets the completion interrupt has the
2069 1.14.2.5 riz ** real map, and the first descriptor gets the
2070 1.14.2.5 riz ** unused map from this descriptor.
2071 1.14.2.5 riz */
2072 1.1 dyoung txr->tx_buffers[first].map = txbuf->map;
2073 1.1 dyoung txbuf->map = map;
2074 1.1 dyoung bus_dmamap_sync(txr->txtag->dt_dmat, map, 0, m_head->m_pkthdr.len,
2075 1.1 dyoung BUS_DMASYNC_PREWRITE);
2076 1.1 dyoung
2077 1.14.2.5 riz /* Set the EOP descriptor that will be marked done */
2078 1.1 dyoung txbuf = &txr->tx_buffers[first];
2079 1.14.2.5 riz txbuf->eop = txd;
2080 1.1 dyoung
2081 1.1 dyoung ixgbe_dmamap_sync(txr->txdma.dma_tag, txr->txdma.dma_map,
2082 1.1 dyoung BUS_DMASYNC_PREREAD | BUS_DMASYNC_PREWRITE);
2083 1.1 dyoung /*
2084 1.1 dyoung * Advance the Transmit Descriptor Tail (Tdt), this tells the
2085 1.1 dyoung * hardware that this frame is available to transmit.
2086 1.1 dyoung */
2087 1.1 dyoung ++txr->total_packets.ev_count;
2088 1.1 dyoung IXGBE_WRITE_REG(&adapter->hw, IXGBE_TDT(txr->me), i);
2089 1.1 dyoung
2090 1.1 dyoung return 0;
2091 1.1 dyoung }
2092 1.1 dyoung
2093 1.1 dyoung static void
2094 1.1 dyoung ixgbe_set_promisc(struct adapter *adapter)
2095 1.1 dyoung {
2096 1.14.2.5 riz struct ether_multi *enm;
2097 1.14.2.5 riz struct ether_multistep step;
2098 1.1 dyoung u_int32_t reg_rctl;
2099 1.14.2.5 riz struct ethercom *ec = &adapter->osdep.ec;
2100 1.1 dyoung struct ifnet *ifp = adapter->ifp;
2101 1.14.2.5 riz int mcnt = 0;
2102 1.1 dyoung
2103 1.1 dyoung reg_rctl = IXGBE_READ_REG(&adapter->hw, IXGBE_FCTRL);
2104 1.1 dyoung reg_rctl &= (~IXGBE_FCTRL_UPE);
2105 1.14.2.5 riz if (ifp->if_flags & IFF_ALLMULTI)
2106 1.14.2.5 riz mcnt = MAX_NUM_MULTICAST_ADDRESSES;
2107 1.14.2.5 riz else {
2108 1.14.2.5 riz ETHER_FIRST_MULTI(step, ec, enm);
2109 1.14.2.5 riz while (enm != NULL) {
2110 1.14.2.5 riz if (mcnt == MAX_NUM_MULTICAST_ADDRESSES)
2111 1.14.2.5 riz break;
2112 1.14.2.5 riz mcnt++;
2113 1.14.2.5 riz ETHER_NEXT_MULTI(step, enm);
2114 1.14.2.5 riz }
2115 1.14.2.5 riz }
2116 1.14.2.5 riz if (mcnt < MAX_NUM_MULTICAST_ADDRESSES)
2117 1.14.2.5 riz reg_rctl &= (~IXGBE_FCTRL_MPE);
2118 1.1 dyoung IXGBE_WRITE_REG(&adapter->hw, IXGBE_FCTRL, reg_rctl);
2119 1.1 dyoung
2120 1.1 dyoung if (ifp->if_flags & IFF_PROMISC) {
2121 1.1 dyoung reg_rctl |= (IXGBE_FCTRL_UPE | IXGBE_FCTRL_MPE);
2122 1.1 dyoung IXGBE_WRITE_REG(&adapter->hw, IXGBE_FCTRL, reg_rctl);
2123 1.1 dyoung } else if (ifp->if_flags & IFF_ALLMULTI) {
2124 1.1 dyoung reg_rctl |= IXGBE_FCTRL_MPE;
2125 1.1 dyoung reg_rctl &= ~IXGBE_FCTRL_UPE;
2126 1.1 dyoung IXGBE_WRITE_REG(&adapter->hw, IXGBE_FCTRL, reg_rctl);
2127 1.1 dyoung }
2128 1.1 dyoung return;
2129 1.1 dyoung }
2130 1.1 dyoung
2131 1.1 dyoung
2132 1.1 dyoung /*********************************************************************
2133 1.1 dyoung * Multicast Update
2134 1.1 dyoung *
2135 1.1 dyoung * This routine is called whenever multicast address list is updated.
2136 1.1 dyoung *
2137 1.1 dyoung **********************************************************************/
2138 1.1 dyoung #define IXGBE_RAR_ENTRIES 16
2139 1.1 dyoung
2140 1.1 dyoung static void
2141 1.1 dyoung ixgbe_set_multi(struct adapter *adapter)
2142 1.1 dyoung {
2143 1.1 dyoung struct ether_multi *enm;
2144 1.1 dyoung struct ether_multistep step;
2145 1.1 dyoung u32 fctrl;
2146 1.1 dyoung u8 *mta;
2147 1.1 dyoung u8 *update_ptr;
2148 1.1 dyoung int mcnt = 0;
2149 1.1 dyoung struct ethercom *ec = &adapter->osdep.ec;
2150 1.1 dyoung struct ifnet *ifp = adapter->ifp;
2151 1.1 dyoung
2152 1.1 dyoung IOCTL_DEBUGOUT("ixgbe_set_multi: begin");
2153 1.1 dyoung
2154 1.1 dyoung mta = adapter->mta;
2155 1.1 dyoung bzero(mta, sizeof(u8) * IXGBE_ETH_LENGTH_OF_ADDRESS *
2156 1.1 dyoung MAX_NUM_MULTICAST_ADDRESSES);
2157 1.1 dyoung
2158 1.14.2.5 riz ifp->if_flags &= ~IFF_ALLMULTI;
2159 1.1 dyoung ETHER_FIRST_MULTI(step, ec, enm);
2160 1.1 dyoung while (enm != NULL) {
2161 1.14.2.5 riz if ((mcnt == MAX_NUM_MULTICAST_ADDRESSES) ||
2162 1.14.2.5 riz (memcmp(enm->enm_addrlo, enm->enm_addrhi,
2163 1.14.2.5 riz ETHER_ADDR_LEN) != 0)) {
2164 1.14.2.5 riz ifp->if_flags |= IFF_ALLMULTI;
2165 1.1 dyoung break;
2166 1.1 dyoung }
2167 1.1 dyoung bcopy(enm->enm_addrlo,
2168 1.1 dyoung &mta[mcnt * IXGBE_ETH_LENGTH_OF_ADDRESS],
2169 1.1 dyoung IXGBE_ETH_LENGTH_OF_ADDRESS);
2170 1.1 dyoung mcnt++;
2171 1.1 dyoung ETHER_NEXT_MULTI(step, enm);
2172 1.1 dyoung }
2173 1.1 dyoung
2174 1.14.2.5 riz fctrl = IXGBE_READ_REG(&adapter->hw, IXGBE_FCTRL);
2175 1.14.2.5 riz fctrl &= ~(IXGBE_FCTRL_UPE | IXGBE_FCTRL_MPE);
2176 1.14.2.5 riz if (ifp->if_flags & IFF_PROMISC)
2177 1.14.2.5 riz fctrl |= (IXGBE_FCTRL_UPE | IXGBE_FCTRL_MPE);
2178 1.14.2.5 riz else if (ifp->if_flags & IFF_ALLMULTI) {
2179 1.14.2.5 riz fctrl |= IXGBE_FCTRL_MPE;
2180 1.14.2.5 riz }
2181 1.14.2.5 riz
2182 1.14.2.5 riz IXGBE_WRITE_REG(&adapter->hw, IXGBE_FCTRL, fctrl);
2183 1.14.2.5 riz
2184 1.14.2.5 riz if (mcnt < MAX_NUM_MULTICAST_ADDRESSES) {
2185 1.14.2.5 riz update_ptr = mta;
2186 1.14.2.5 riz ixgbe_update_mc_addr_list(&adapter->hw,
2187 1.14.2.5 riz update_ptr, mcnt, ixgbe_mc_array_itr, TRUE);
2188 1.14.2.5 riz }
2189 1.1 dyoung
2190 1.1 dyoung return;
2191 1.1 dyoung }
2192 1.1 dyoung
2193 1.1 dyoung /*
2194 1.1 dyoung * This is an iterator function now needed by the multicast
2195 1.1 dyoung * shared code. It simply feeds the shared code routine the
2196 1.1 dyoung * addresses in the array of ixgbe_set_multi() one by one.
2197 1.1 dyoung */
2198 1.1 dyoung static u8 *
2199 1.1 dyoung ixgbe_mc_array_itr(struct ixgbe_hw *hw, u8 **update_ptr, u32 *vmdq)
2200 1.1 dyoung {
2201 1.1 dyoung u8 *addr = *update_ptr;
2202 1.1 dyoung u8 *newptr;
2203 1.1 dyoung *vmdq = 0;
2204 1.1 dyoung
2205 1.1 dyoung newptr = addr + IXGBE_ETH_LENGTH_OF_ADDRESS;
2206 1.1 dyoung *update_ptr = newptr;
2207 1.1 dyoung return addr;
2208 1.1 dyoung }
2209 1.1 dyoung
2210 1.1 dyoung
2211 1.1 dyoung /*********************************************************************
2212 1.1 dyoung * Timer routine
2213 1.1 dyoung *
2214 1.1 dyoung * This routine checks for link status,updates statistics,
2215 1.1 dyoung * and runs the watchdog check.
2216 1.1 dyoung *
2217 1.1 dyoung **********************************************************************/
2218 1.1 dyoung
2219 1.1 dyoung static void
2220 1.1 dyoung ixgbe_local_timer1(void *arg)
2221 1.1 dyoung {
2222 1.14.2.4 riz struct adapter *adapter = arg;
2223 1.1 dyoung device_t dev = adapter->dev;
2224 1.14.2.4 riz struct ix_queue *que = adapter->queues;
2225 1.14.2.4 riz struct tx_ring *txr = adapter->tx_rings;
2226 1.14.2.4 riz int hung = 0, paused = 0;
2227 1.1 dyoung
2228 1.1 dyoung KASSERT(mutex_owned(&adapter->core_mtx));
2229 1.1 dyoung
2230 1.1 dyoung /* Check for pluggable optics */
2231 1.1 dyoung if (adapter->sfp_probe)
2232 1.1 dyoung if (!ixgbe_sfp_probe(adapter))
2233 1.1 dyoung goto out; /* Nothing to do */
2234 1.1 dyoung
2235 1.1 dyoung ixgbe_update_link_status(adapter);
2236 1.1 dyoung ixgbe_update_stats_counters(adapter);
2237 1.1 dyoung
2238 1.1 dyoung /*
2239 1.1 dyoung * If the interface has been paused
2240 1.1 dyoung * then don't do the watchdog check
2241 1.1 dyoung */
2242 1.1 dyoung if (IXGBE_READ_REG(&adapter->hw, IXGBE_TFCS) & IXGBE_TFCS_TXOFF)
2243 1.14.2.4 riz paused = 1;
2244 1.1 dyoung
2245 1.1 dyoung /*
2246 1.14.2.4 riz ** Check the TX queues status
2247 1.14.2.4 riz ** - watchdog only if all queues show hung
2248 1.14.2.4 riz */
2249 1.14.2.4 riz for (int i = 0; i < adapter->num_queues; i++, que++, txr++) {
2250 1.14.2.4 riz if ((txr->queue_status == IXGBE_QUEUE_HUNG) &&
2251 1.14.2.4 riz (paused == 0))
2252 1.14.2.4 riz ++hung;
2253 1.14.2.4 riz else if (txr->queue_status == IXGBE_QUEUE_WORKING)
2254 1.14.2.6 snj #ifndef IXGBE_LEGACY_TX
2255 1.14.2.6 snj softint_schedule(txr->txq_si);
2256 1.14.2.6 snj #else
2257 1.14.2.4 riz softint_schedule(que->que_si);
2258 1.14.2.6 snj #endif
2259 1.14.2.4 riz }
2260 1.14.2.4 riz /* Only truely watchdog if all queues show hung */
2261 1.14.2.4 riz if (hung == adapter->num_queues)
2262 1.14.2.4 riz goto watchdog;
2263 1.1 dyoung
2264 1.1 dyoung out:
2265 1.1 dyoung callout_reset(&adapter->timer, hz, ixgbe_local_timer, adapter);
2266 1.1 dyoung return;
2267 1.1 dyoung
2268 1.14.2.4 riz watchdog:
2269 1.1 dyoung device_printf(adapter->dev, "Watchdog timeout -- resetting\n");
2270 1.1 dyoung device_printf(dev,"Queue(%d) tdh = %d, hw tdt = %d\n", txr->me,
2271 1.1 dyoung IXGBE_READ_REG(&adapter->hw, IXGBE_TDH(txr->me)),
2272 1.1 dyoung IXGBE_READ_REG(&adapter->hw, IXGBE_TDT(txr->me)));
2273 1.1 dyoung device_printf(dev,"TX(%d) desc avail = %d,"
2274 1.1 dyoung "Next TX to Clean = %d\n",
2275 1.1 dyoung txr->me, txr->tx_avail, txr->next_to_clean);
2276 1.1 dyoung adapter->ifp->if_flags &= ~IFF_RUNNING;
2277 1.1 dyoung adapter->watchdog_events.ev_count++;
2278 1.1 dyoung ixgbe_init_locked(adapter);
2279 1.1 dyoung }
2280 1.1 dyoung
2281 1.1 dyoung static void
2282 1.1 dyoung ixgbe_local_timer(void *arg)
2283 1.1 dyoung {
2284 1.1 dyoung struct adapter *adapter = arg;
2285 1.1 dyoung
2286 1.1 dyoung IXGBE_CORE_LOCK(adapter);
2287 1.1 dyoung ixgbe_local_timer1(adapter);
2288 1.1 dyoung IXGBE_CORE_UNLOCK(adapter);
2289 1.1 dyoung }
2290 1.1 dyoung
2291 1.1 dyoung /*
2292 1.1 dyoung ** Note: this routine updates the OS on the link state
2293 1.1 dyoung ** the real check of the hardware only happens with
2294 1.1 dyoung ** a link interrupt.
2295 1.1 dyoung */
2296 1.1 dyoung static void
2297 1.1 dyoung ixgbe_update_link_status(struct adapter *adapter)
2298 1.1 dyoung {
2299 1.1 dyoung struct ifnet *ifp = adapter->ifp;
2300 1.1 dyoung device_t dev = adapter->dev;
2301 1.1 dyoung
2302 1.1 dyoung
2303 1.1 dyoung if (adapter->link_up){
2304 1.1 dyoung if (adapter->link_active == FALSE) {
2305 1.1 dyoung if (bootverbose)
2306 1.1 dyoung device_printf(dev,"Link is up %d Gbps %s \n",
2307 1.1 dyoung ((adapter->link_speed == 128)? 10:1),
2308 1.1 dyoung "Full Duplex");
2309 1.1 dyoung adapter->link_active = TRUE;
2310 1.14.2.4 riz /* Update any Flow Control changes */
2311 1.14.2.4 riz ixgbe_fc_enable(&adapter->hw);
2312 1.1 dyoung if_link_state_change(ifp, LINK_STATE_UP);
2313 1.1 dyoung }
2314 1.1 dyoung } else { /* Link down */
2315 1.1 dyoung if (adapter->link_active == TRUE) {
2316 1.1 dyoung if (bootverbose)
2317 1.1 dyoung device_printf(dev,"Link is Down\n");
2318 1.1 dyoung if_link_state_change(ifp, LINK_STATE_DOWN);
2319 1.1 dyoung adapter->link_active = FALSE;
2320 1.1 dyoung }
2321 1.1 dyoung }
2322 1.1 dyoung
2323 1.1 dyoung return;
2324 1.1 dyoung }
2325 1.1 dyoung
2326 1.1 dyoung
2327 1.1 dyoung static void
2328 1.1 dyoung ixgbe_ifstop(struct ifnet *ifp, int disable)
2329 1.1 dyoung {
2330 1.1 dyoung struct adapter *adapter = ifp->if_softc;
2331 1.1 dyoung
2332 1.1 dyoung IXGBE_CORE_LOCK(adapter);
2333 1.1 dyoung ixgbe_stop(adapter);
2334 1.1 dyoung IXGBE_CORE_UNLOCK(adapter);
2335 1.1 dyoung }
2336 1.1 dyoung
2337 1.1 dyoung /*********************************************************************
2338 1.1 dyoung *
2339 1.1 dyoung * This routine disables all traffic on the adapter by issuing a
2340 1.1 dyoung * global reset on the MAC and deallocates TX/RX buffers.
2341 1.1 dyoung *
2342 1.1 dyoung **********************************************************************/
2343 1.1 dyoung
2344 1.1 dyoung static void
2345 1.1 dyoung ixgbe_stop(void *arg)
2346 1.1 dyoung {
2347 1.1 dyoung struct ifnet *ifp;
2348 1.1 dyoung struct adapter *adapter = arg;
2349 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
2350 1.1 dyoung ifp = adapter->ifp;
2351 1.1 dyoung
2352 1.1 dyoung KASSERT(mutex_owned(&adapter->core_mtx));
2353 1.1 dyoung
2354 1.1 dyoung INIT_DEBUGOUT("ixgbe_stop: begin\n");
2355 1.1 dyoung ixgbe_disable_intr(adapter);
2356 1.14.2.4 riz callout_stop(&adapter->timer);
2357 1.1 dyoung
2358 1.14.2.4 riz /* Let the stack know...*/
2359 1.14.2.4 riz ifp->if_flags &= ~IFF_RUNNING;
2360 1.1 dyoung
2361 1.1 dyoung ixgbe_reset_hw(hw);
2362 1.1 dyoung hw->adapter_stopped = FALSE;
2363 1.1 dyoung ixgbe_stop_adapter(hw);
2364 1.14.2.6 snj if (hw->mac.type == ixgbe_mac_82599EB)
2365 1.14.2.6 snj ixgbe_stop_mac_link_on_d3_82599(hw);
2366 1.14.2.6 snj /* Turn off the laser - noop with no optics */
2367 1.14.2.6 snj ixgbe_disable_tx_laser(hw);
2368 1.14.2.6 snj
2369 1.14.2.6 snj /* Update the stack */
2370 1.14.2.6 snj adapter->link_up = FALSE;
2371 1.14.2.6 snj ixgbe_update_link_status(adapter);
2372 1.1 dyoung
2373 1.1 dyoung /* reprogram the RAR[0] in case user changed it. */
2374 1.1 dyoung ixgbe_set_rar(&adapter->hw, 0, adapter->hw.mac.addr, 0, IXGBE_RAH_AV);
2375 1.1 dyoung
2376 1.1 dyoung return;
2377 1.1 dyoung }
2378 1.1 dyoung
2379 1.1 dyoung
2380 1.1 dyoung /*********************************************************************
2381 1.1 dyoung *
2382 1.1 dyoung * Determine hardware revision.
2383 1.1 dyoung *
2384 1.1 dyoung **********************************************************************/
2385 1.1 dyoung static void
2386 1.1 dyoung ixgbe_identify_hardware(struct adapter *adapter)
2387 1.1 dyoung {
2388 1.1 dyoung pcitag_t tag;
2389 1.1 dyoung pci_chipset_tag_t pc;
2390 1.1 dyoung pcireg_t subid, id;
2391 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
2392 1.1 dyoung
2393 1.1 dyoung pc = adapter->osdep.pc;
2394 1.1 dyoung tag = adapter->osdep.tag;
2395 1.1 dyoung
2396 1.1 dyoung id = pci_conf_read(pc, tag, PCI_ID_REG);
2397 1.1 dyoung subid = pci_conf_read(pc, tag, PCI_SUBSYS_ID_REG);
2398 1.1 dyoung
2399 1.1 dyoung /* Save off the information about this board */
2400 1.1 dyoung hw->vendor_id = PCI_VENDOR(id);
2401 1.1 dyoung hw->device_id = PCI_PRODUCT(id);
2402 1.1 dyoung hw->revision_id =
2403 1.1 dyoung PCI_REVISION(pci_conf_read(pc, tag, PCI_CLASS_REG));
2404 1.1 dyoung hw->subsystem_vendor_id = PCI_SUBSYS_VENDOR(subid);
2405 1.1 dyoung hw->subsystem_device_id = PCI_SUBSYS_ID(subid);
2406 1.1 dyoung
2407 1.1 dyoung /* We need this here to set the num_segs below */
2408 1.1 dyoung ixgbe_set_mac_type(hw);
2409 1.1 dyoung
2410 1.1 dyoung /* Pick up the 82599 and VF settings */
2411 1.1 dyoung if (hw->mac.type != ixgbe_mac_82598EB) {
2412 1.1 dyoung hw->phy.smart_speed = ixgbe_smart_speed;
2413 1.1 dyoung adapter->num_segs = IXGBE_82599_SCATTER;
2414 1.1 dyoung } else
2415 1.1 dyoung adapter->num_segs = IXGBE_82598_SCATTER;
2416 1.1 dyoung
2417 1.1 dyoung return;
2418 1.1 dyoung }
2419 1.1 dyoung
2420 1.1 dyoung /*********************************************************************
2421 1.1 dyoung *
2422 1.1 dyoung * Determine optic type
2423 1.1 dyoung *
2424 1.1 dyoung **********************************************************************/
2425 1.1 dyoung static void
2426 1.1 dyoung ixgbe_setup_optics(struct adapter *adapter)
2427 1.1 dyoung {
2428 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
2429 1.1 dyoung int layer;
2430 1.14.2.5 riz
2431 1.1 dyoung layer = ixgbe_get_supported_physical_layer(hw);
2432 1.14.2.4 riz
2433 1.14.2.4 riz if (layer & IXGBE_PHYSICAL_LAYER_10GBASE_T) {
2434 1.14.2.4 riz adapter->optics = IFM_10G_T;
2435 1.14.2.4 riz return;
2436 1.14.2.4 riz }
2437 1.14.2.4 riz
2438 1.14.2.4 riz if (layer & IXGBE_PHYSICAL_LAYER_1000BASE_T) {
2439 1.14.2.4 riz adapter->optics = IFM_1000_T;
2440 1.14.2.4 riz return;
2441 1.14.2.4 riz }
2442 1.14.2.4 riz
2443 1.14.2.4 riz if (layer & IXGBE_PHYSICAL_LAYER_1000BASE_SX) {
2444 1.14.2.4 riz adapter->optics = IFM_1000_SX;
2445 1.14.2.4 riz return;
2446 1.14.2.4 riz }
2447 1.14.2.4 riz
2448 1.14.2.4 riz if (layer & (IXGBE_PHYSICAL_LAYER_10GBASE_LR |
2449 1.14.2.4 riz IXGBE_PHYSICAL_LAYER_10GBASE_LRM)) {
2450 1.14.2.4 riz adapter->optics = IFM_10G_LR;
2451 1.14.2.4 riz return;
2452 1.1 dyoung }
2453 1.14.2.4 riz
2454 1.14.2.4 riz if (layer & IXGBE_PHYSICAL_LAYER_10GBASE_SR) {
2455 1.14.2.4 riz adapter->optics = IFM_10G_SR;
2456 1.14.2.4 riz return;
2457 1.14.2.4 riz }
2458 1.14.2.4 riz
2459 1.14.2.4 riz if (layer & IXGBE_PHYSICAL_LAYER_SFP_PLUS_CU) {
2460 1.14.2.4 riz adapter->optics = IFM_10G_TWINAX;
2461 1.14.2.4 riz return;
2462 1.14.2.4 riz }
2463 1.14.2.4 riz
2464 1.14.2.4 riz if (layer & (IXGBE_PHYSICAL_LAYER_10GBASE_KX4 |
2465 1.14.2.4 riz IXGBE_PHYSICAL_LAYER_10GBASE_CX4)) {
2466 1.14.2.4 riz adapter->optics = IFM_10G_CX4;
2467 1.14.2.4 riz return;
2468 1.14.2.4 riz }
2469 1.14.2.4 riz
2470 1.14.2.4 riz /* If we get here just set the default */
2471 1.14.2.4 riz adapter->optics = IFM_ETHER | IFM_AUTO;
2472 1.1 dyoung return;
2473 1.1 dyoung }
2474 1.1 dyoung
2475 1.1 dyoung /*********************************************************************
2476 1.1 dyoung *
2477 1.1 dyoung * Setup the Legacy or MSI Interrupt handler
2478 1.1 dyoung *
2479 1.1 dyoung **********************************************************************/
2480 1.1 dyoung static int
2481 1.1 dyoung ixgbe_allocate_legacy(struct adapter *adapter, const struct pci_attach_args *pa)
2482 1.1 dyoung {
2483 1.14.2.5 riz device_t dev = adapter->dev;
2484 1.1 dyoung struct ix_queue *que = adapter->queues;
2485 1.14.2.5 riz #ifndef IXGBE_LEGACY_TX
2486 1.14.2.4 riz struct tx_ring *txr = adapter->tx_rings;
2487 1.14.2.4 riz #endif
2488 1.9 skrll char intrbuf[PCI_INTRSTR_LEN];
2489 1.9 skrll #if 0
2490 1.14.2.5 riz int rid = 0;
2491 1.1 dyoung
2492 1.1 dyoung /* MSI RID at 1 */
2493 1.1 dyoung if (adapter->msix == 1)
2494 1.1 dyoung rid = 1;
2495 1.9 skrll #endif
2496 1.1 dyoung
2497 1.1 dyoung /* We allocate a single interrupt resource */
2498 1.1 dyoung if (pci_intr_map(pa, &adapter->osdep.ih) != 0) {
2499 1.1 dyoung aprint_error_dev(dev, "unable to map interrupt\n");
2500 1.1 dyoung return ENXIO;
2501 1.1 dyoung } else {
2502 1.1 dyoung aprint_normal_dev(dev, "interrupting at %s\n",
2503 1.14 chs pci_intr_string(adapter->osdep.pc, adapter->osdep.ih,
2504 1.14 chs intrbuf, sizeof(intrbuf)));
2505 1.1 dyoung }
2506 1.1 dyoung
2507 1.1 dyoung /*
2508 1.1 dyoung * Try allocating a fast interrupt and the associated deferred
2509 1.1 dyoung * processing contexts.
2510 1.1 dyoung */
2511 1.14.2.5 riz #ifndef IXGBE_LEGACY_TX
2512 1.14.2.4 riz txr->txq_si = softint_establish(SOFTINT_NET, ixgbe_deferred_mq_start,
2513 1.14.2.4 riz txr);
2514 1.14.2.4 riz #endif
2515 1.1 dyoung que->que_si = softint_establish(SOFTINT_NET, ixgbe_handle_que, que);
2516 1.1 dyoung
2517 1.1 dyoung /* Tasklets for Link, SFP and Multispeed Fiber */
2518 1.1 dyoung adapter->link_si =
2519 1.1 dyoung softint_establish(SOFTINT_NET, ixgbe_handle_link, adapter);
2520 1.1 dyoung adapter->mod_si =
2521 1.1 dyoung softint_establish(SOFTINT_NET, ixgbe_handle_mod, adapter);
2522 1.1 dyoung adapter->msf_si =
2523 1.1 dyoung softint_establish(SOFTINT_NET, ixgbe_handle_msf, adapter);
2524 1.1 dyoung
2525 1.1 dyoung #ifdef IXGBE_FDIR
2526 1.1 dyoung adapter->fdir_si =
2527 1.1 dyoung softint_establish(SOFTINT_NET, ixgbe_reinit_fdir, adapter);
2528 1.1 dyoung #endif
2529 1.1 dyoung if (que->que_si == NULL ||
2530 1.1 dyoung adapter->link_si == NULL ||
2531 1.1 dyoung adapter->mod_si == NULL ||
2532 1.1 dyoung #ifdef IXGBE_FDIR
2533 1.1 dyoung adapter->fdir_si == NULL ||
2534 1.1 dyoung #endif
2535 1.1 dyoung adapter->msf_si == NULL) {
2536 1.1 dyoung aprint_error_dev(dev,
2537 1.1 dyoung "could not establish software interrupts\n");
2538 1.1 dyoung return ENXIO;
2539 1.1 dyoung }
2540 1.1 dyoung
2541 1.1 dyoung adapter->osdep.intr = pci_intr_establish(adapter->osdep.pc,
2542 1.1 dyoung adapter->osdep.ih, IPL_NET, ixgbe_legacy_irq, que);
2543 1.1 dyoung if (adapter->osdep.intr == NULL) {
2544 1.1 dyoung aprint_error_dev(dev, "failed to register interrupt handler\n");
2545 1.1 dyoung softint_disestablish(que->que_si);
2546 1.1 dyoung softint_disestablish(adapter->link_si);
2547 1.1 dyoung softint_disestablish(adapter->mod_si);
2548 1.1 dyoung softint_disestablish(adapter->msf_si);
2549 1.1 dyoung #ifdef IXGBE_FDIR
2550 1.1 dyoung softint_disestablish(adapter->fdir_si);
2551 1.1 dyoung #endif
2552 1.1 dyoung return ENXIO;
2553 1.1 dyoung }
2554 1.1 dyoung /* For simplicity in the handlers */
2555 1.1 dyoung adapter->que_mask = IXGBE_EIMS_ENABLE_MASK;
2556 1.1 dyoung
2557 1.1 dyoung return (0);
2558 1.1 dyoung }
2559 1.1 dyoung
2560 1.1 dyoung
2561 1.1 dyoung /*********************************************************************
2562 1.1 dyoung *
2563 1.1 dyoung * Setup MSIX Interrupt resources and handlers
2564 1.1 dyoung *
2565 1.1 dyoung **********************************************************************/
2566 1.1 dyoung static int
2567 1.1 dyoung ixgbe_allocate_msix(struct adapter *adapter, const struct pci_attach_args *pa)
2568 1.1 dyoung {
2569 1.1 dyoung #if !defined(NETBSD_MSI_OR_MSIX)
2570 1.1 dyoung return 0;
2571 1.1 dyoung #else
2572 1.1 dyoung device_t dev = adapter->dev;
2573 1.1 dyoung struct ix_queue *que = adapter->queues;
2574 1.14.2.4 riz struct tx_ring *txr = adapter->tx_rings;
2575 1.1 dyoung int error, rid, vector = 0;
2576 1.14.2.6 snj int cpu_id = 0;
2577 1.14.2.6 snj #ifdef RSS
2578 1.14.2.6 snj cpuset_t cpu_mask;
2579 1.14.2.6 snj #endif
2580 1.14.2.6 snj
2581 1.14.2.6 snj #ifdef RSS
2582 1.14.2.6 snj /*
2583 1.14.2.6 snj * If we're doing RSS, the number of queues needs to
2584 1.14.2.6 snj * match the number of RSS buckets that are configured.
2585 1.14.2.6 snj *
2586 1.14.2.6 snj * + If there's more queues than RSS buckets, we'll end
2587 1.14.2.6 snj * up with queues that get no traffic.
2588 1.14.2.6 snj *
2589 1.14.2.6 snj * + If there's more RSS buckets than queues, we'll end
2590 1.14.2.6 snj * up having multiple RSS buckets map to the same queue,
2591 1.14.2.6 snj * so there'll be some contention.
2592 1.14.2.6 snj */
2593 1.14.2.6 snj if (adapter->num_queues != rss_getnumbuckets()) {
2594 1.14.2.6 snj device_printf(dev,
2595 1.14.2.6 snj "%s: number of queues (%d) != number of RSS buckets (%d)"
2596 1.14.2.6 snj "; performance will be impacted.\n",
2597 1.14.2.6 snj __func__,
2598 1.14.2.6 snj adapter->num_queues,
2599 1.14.2.6 snj rss_getnumbuckets());
2600 1.14.2.6 snj }
2601 1.14.2.6 snj #endif
2602 1.1 dyoung
2603 1.14.2.4 riz for (int i = 0; i < adapter->num_queues; i++, vector++, que++, txr++) {
2604 1.1 dyoung rid = vector + 1;
2605 1.1 dyoung que->res = bus_alloc_resource_any(dev, SYS_RES_IRQ, &rid,
2606 1.1 dyoung RF_SHAREABLE | RF_ACTIVE);
2607 1.1 dyoung if (que->res == NULL) {
2608 1.1 dyoung aprint_error_dev(dev,"Unable to allocate"
2609 1.1 dyoung " bus resource: que interrupt [%d]\n", vector);
2610 1.1 dyoung return (ENXIO);
2611 1.1 dyoung }
2612 1.1 dyoung /* Set the handler function */
2613 1.1 dyoung error = bus_setup_intr(dev, que->res,
2614 1.1 dyoung INTR_TYPE_NET | INTR_MPSAFE, NULL,
2615 1.1 dyoung ixgbe_msix_que, que, &que->tag);
2616 1.1 dyoung if (error) {
2617 1.1 dyoung que->res = NULL;
2618 1.1 dyoung aprint_error_dev(dev,
2619 1.1 dyoung "Failed to register QUE handler\n");
2620 1.1 dyoung return error;
2621 1.1 dyoung }
2622 1.1 dyoung #if __FreeBSD_version >= 800504
2623 1.1 dyoung bus_describe_intr(dev, que->res, que->tag, "que %d", i);
2624 1.1 dyoung #endif
2625 1.1 dyoung que->msix = vector;
2626 1.1 dyoung adapter->que_mask |= (u64)(1 << que->msix);
2627 1.14.2.6 snj #ifdef RSS
2628 1.1 dyoung /*
2629 1.14.2.6 snj * The queue ID is used as the RSS layer bucket ID.
2630 1.14.2.6 snj * We look up the queue ID -> RSS CPU ID and select
2631 1.14.2.6 snj * that.
2632 1.14.2.6 snj */
2633 1.14.2.6 snj cpu_id = rss_getcpu(i % rss_getnumbuckets());
2634 1.14.2.6 snj #else
2635 1.14.2.6 snj /*
2636 1.14.2.6 snj * Bind the msix vector, and thus the
2637 1.14.2.6 snj * rings to the corresponding cpu.
2638 1.14.2.6 snj *
2639 1.14.2.6 snj * This just happens to match the default RSS round-robin
2640 1.14.2.6 snj * bucket -> queue -> CPU allocation.
2641 1.14.2.6 snj */
2642 1.1 dyoung if (adapter->num_queues > 1)
2643 1.14.2.6 snj cpu_id = i;
2644 1.14.2.6 snj #endif
2645 1.14.2.6 snj if (adapter->num_queues > 1)
2646 1.14.2.6 snj bus_bind_intr(dev, que->res, cpu_id);
2647 1.14.2.6 snj
2648 1.14.2.6 snj #ifdef RSS
2649 1.14.2.6 snj device_printf(dev,
2650 1.14.2.6 snj "Bound RSS bucket %d to CPU %d\n",
2651 1.14.2.6 snj i, cpu_id);
2652 1.14.2.6 snj #else
2653 1.14.2.6 snj device_printf(dev,
2654 1.14.2.6 snj "Bound queue %d to cpu %d\n",
2655 1.14.2.6 snj i, cpu_id);
2656 1.14.2.6 snj #endif
2657 1.1 dyoung
2658 1.14.2.5 riz #ifndef IXGBE_LEGACY_TX
2659 1.14.2.4 riz txr->txq_si = softint_establish(SOFTINT_NET,
2660 1.14.2.4 riz ixgbe_deferred_mq_start, txr);
2661 1.14.2.4 riz #endif
2662 1.14.2.4 riz que->que_si = softint_establish(SOFTINT_NET, ixgbe_handle_que,
2663 1.14.2.4 riz que);
2664 1.1 dyoung if (que->que_si == NULL) {
2665 1.1 dyoung aprint_error_dev(dev,
2666 1.1 dyoung "could not establish software interrupt\n");
2667 1.1 dyoung }
2668 1.1 dyoung }
2669 1.1 dyoung
2670 1.1 dyoung /* and Link */
2671 1.1 dyoung rid = vector + 1;
2672 1.1 dyoung adapter->res = bus_alloc_resource_any(dev,
2673 1.1 dyoung SYS_RES_IRQ, &rid, RF_SHAREABLE | RF_ACTIVE);
2674 1.1 dyoung if (!adapter->res) {
2675 1.1 dyoung aprint_error_dev(dev,"Unable to allocate bus resource: "
2676 1.1 dyoung "Link interrupt [%d]\n", rid);
2677 1.1 dyoung return (ENXIO);
2678 1.1 dyoung }
2679 1.1 dyoung /* Set the link handler function */
2680 1.1 dyoung error = bus_setup_intr(dev, adapter->res,
2681 1.1 dyoung INTR_TYPE_NET | INTR_MPSAFE, NULL,
2682 1.1 dyoung ixgbe_msix_link, adapter, &adapter->tag);
2683 1.1 dyoung if (error) {
2684 1.1 dyoung adapter->res = NULL;
2685 1.1 dyoung aprint_error_dev(dev, "Failed to register LINK handler\n");
2686 1.1 dyoung return (error);
2687 1.1 dyoung }
2688 1.1 dyoung #if __FreeBSD_version >= 800504
2689 1.1 dyoung bus_describe_intr(dev, adapter->res, adapter->tag, "link");
2690 1.1 dyoung #endif
2691 1.1 dyoung adapter->linkvec = vector;
2692 1.1 dyoung /* Tasklets for Link, SFP and Multispeed Fiber */
2693 1.1 dyoung adapter->link_si =
2694 1.1 dyoung softint_establish(SOFTINT_NET, ixgbe_handle_link, adapter);
2695 1.1 dyoung adapter->mod_si =
2696 1.1 dyoung softint_establish(SOFTINT_NET, ixgbe_handle_mod, adapter);
2697 1.1 dyoung adapter->msf_si =
2698 1.1 dyoung softint_establish(SOFTINT_NET, ixgbe_handle_msf, adapter);
2699 1.1 dyoung #ifdef IXGBE_FDIR
2700 1.1 dyoung adapter->fdir_si =
2701 1.1 dyoung softint_establish(SOFTINT_NET, ixgbe_reinit_fdir, adapter);
2702 1.1 dyoung #endif
2703 1.1 dyoung
2704 1.1 dyoung return (0);
2705 1.1 dyoung #endif
2706 1.1 dyoung }
2707 1.1 dyoung
2708 1.1 dyoung /*
2709 1.1 dyoung * Setup Either MSI/X or MSI
2710 1.1 dyoung */
2711 1.1 dyoung static int
2712 1.1 dyoung ixgbe_setup_msix(struct adapter *adapter)
2713 1.1 dyoung {
2714 1.1 dyoung #if !defined(NETBSD_MSI_OR_MSIX)
2715 1.1 dyoung return 0;
2716 1.1 dyoung #else
2717 1.1 dyoung device_t dev = adapter->dev;
2718 1.1 dyoung int rid, want, queues, msgs;
2719 1.1 dyoung
2720 1.1 dyoung /* Override by tuneable */
2721 1.1 dyoung if (ixgbe_enable_msix == 0)
2722 1.1 dyoung goto msi;
2723 1.1 dyoung
2724 1.1 dyoung /* First try MSI/X */
2725 1.14.2.6 snj msgs = pci_msix_count(dev);
2726 1.14.2.6 snj if (msgs == 0)
2727 1.14.2.6 snj goto msi;
2728 1.1 dyoung rid = PCI_BAR(MSIX_82598_BAR);
2729 1.1 dyoung adapter->msix_mem = bus_alloc_resource_any(dev,
2730 1.1 dyoung SYS_RES_MEMORY, &rid, RF_ACTIVE);
2731 1.14.2.6 snj if (adapter->msix_mem == NULL) {
2732 1.1 dyoung rid += 4; /* 82599 maps in higher BAR */
2733 1.1 dyoung adapter->msix_mem = bus_alloc_resource_any(dev,
2734 1.1 dyoung SYS_RES_MEMORY, &rid, RF_ACTIVE);
2735 1.1 dyoung }
2736 1.14.2.6 snj if (adapter->msix_mem == NULL) {
2737 1.1 dyoung /* May not be enabled */
2738 1.1 dyoung device_printf(adapter->dev,
2739 1.1 dyoung "Unable to map MSIX table \n");
2740 1.1 dyoung goto msi;
2741 1.1 dyoung }
2742 1.1 dyoung
2743 1.1 dyoung /* Figure out a reasonable auto config value */
2744 1.1 dyoung queues = (mp_ncpus > (msgs-1)) ? (msgs-1) : mp_ncpus;
2745 1.1 dyoung
2746 1.14.2.6 snj /* Override based on tuneable */
2747 1.1 dyoung if (ixgbe_num_queues != 0)
2748 1.1 dyoung queues = ixgbe_num_queues;
2749 1.14.2.6 snj
2750 1.14.2.6 snj #ifdef RSS
2751 1.14.2.6 snj /* If we're doing RSS, clamp at the number of RSS buckets */
2752 1.14.2.6 snj if (queues > rss_getnumbuckets())
2753 1.14.2.6 snj queues = rss_getnumbuckets();
2754 1.14.2.6 snj #endif
2755 1.14.2.6 snj
2756 1.14.2.6 snj /* reflect correct sysctl value */
2757 1.14.2.6 snj ixgbe_num_queues = queues;
2758 1.1 dyoung
2759 1.1 dyoung /*
2760 1.1 dyoung ** Want one vector (RX/TX pair) per queue
2761 1.1 dyoung ** plus an additional for Link.
2762 1.1 dyoung */
2763 1.1 dyoung want = queues + 1;
2764 1.1 dyoung if (msgs >= want)
2765 1.1 dyoung msgs = want;
2766 1.1 dyoung else {
2767 1.1 dyoung device_printf(adapter->dev,
2768 1.1 dyoung "MSIX Configuration Problem, "
2769 1.1 dyoung "%d vectors but %d queues wanted!\n",
2770 1.1 dyoung msgs, want);
2771 1.14.2.6 snj goto msi;
2772 1.1 dyoung }
2773 1.14.2.6 snj if ((pci_alloc_msix(dev, &msgs) == 0) && (msgs == want)) {
2774 1.1 dyoung device_printf(adapter->dev,
2775 1.1 dyoung "Using MSIX interrupts with %d vectors\n", msgs);
2776 1.1 dyoung adapter->num_queues = queues;
2777 1.1 dyoung return (msgs);
2778 1.1 dyoung }
2779 1.14.2.6 snj /*
2780 1.14.2.6 snj ** If MSIX alloc failed or provided us with
2781 1.14.2.6 snj ** less than needed, free and fall through to MSI
2782 1.14.2.6 snj */
2783 1.14.2.6 snj pci_release_msi(dev);
2784 1.14.2.6 snj
2785 1.1 dyoung msi:
2786 1.1 dyoung msgs = pci_msi_count(dev);
2787 1.14.2.6 snj if (adapter->msix_mem != NULL) {
2788 1.14.2.6 snj bus_release_resource(dev, SYS_RES_MEMORY,
2789 1.14.2.6 snj rid, adapter->msix_mem);
2790 1.14.2.6 snj adapter->msix_mem = NULL;
2791 1.14.2.6 snj }
2792 1.14.2.6 snj msgs = 1;
2793 1.14.2.6 snj if (pci_alloc_msi(dev, &msgs) == 0) {
2794 1.14.2.3 martin device_printf(adapter->dev,"Using an MSI interrupt\n");
2795 1.14.2.6 snj return (msgs);
2796 1.14.2.6 snj }
2797 1.14.2.6 snj device_printf(adapter->dev,"Using a Legacy interrupt\n");
2798 1.14.2.6 snj return (0);
2799 1.1 dyoung #endif
2800 1.1 dyoung }
2801 1.1 dyoung
2802 1.1 dyoung
2803 1.1 dyoung static int
2804 1.1 dyoung ixgbe_allocate_pci_resources(struct adapter *adapter, const struct pci_attach_args *pa)
2805 1.1 dyoung {
2806 1.1 dyoung pcireg_t memtype;
2807 1.1 dyoung device_t dev = adapter->dev;
2808 1.1 dyoung bus_addr_t addr;
2809 1.1 dyoung int flags;
2810 1.1 dyoung
2811 1.1 dyoung memtype = pci_mapreg_type(pa->pa_pc, pa->pa_tag, PCI_BAR(0));
2812 1.1 dyoung switch (memtype) {
2813 1.1 dyoung case PCI_MAPREG_TYPE_MEM | PCI_MAPREG_MEM_TYPE_32BIT:
2814 1.1 dyoung case PCI_MAPREG_TYPE_MEM | PCI_MAPREG_MEM_TYPE_64BIT:
2815 1.1 dyoung adapter->osdep.mem_bus_space_tag = pa->pa_memt;
2816 1.1 dyoung if (pci_mapreg_info(pa->pa_pc, pa->pa_tag, PCI_BAR(0),
2817 1.1 dyoung memtype, &addr, &adapter->osdep.mem_size, &flags) != 0)
2818 1.1 dyoung goto map_err;
2819 1.1 dyoung if ((flags & BUS_SPACE_MAP_PREFETCHABLE) != 0) {
2820 1.1 dyoung aprint_normal_dev(dev, "clearing prefetchable bit\n");
2821 1.1 dyoung flags &= ~BUS_SPACE_MAP_PREFETCHABLE;
2822 1.1 dyoung }
2823 1.1 dyoung if (bus_space_map(adapter->osdep.mem_bus_space_tag, addr,
2824 1.1 dyoung adapter->osdep.mem_size, flags,
2825 1.1 dyoung &adapter->osdep.mem_bus_space_handle) != 0) {
2826 1.1 dyoung map_err:
2827 1.1 dyoung adapter->osdep.mem_size = 0;
2828 1.1 dyoung aprint_error_dev(dev, "unable to map BAR0\n");
2829 1.1 dyoung return ENXIO;
2830 1.1 dyoung }
2831 1.1 dyoung break;
2832 1.1 dyoung default:
2833 1.1 dyoung aprint_error_dev(dev, "unexpected type on BAR0\n");
2834 1.1 dyoung return ENXIO;
2835 1.1 dyoung }
2836 1.1 dyoung
2837 1.1 dyoung /* Legacy defaults */
2838 1.1 dyoung adapter->num_queues = 1;
2839 1.1 dyoung adapter->hw.back = &adapter->osdep;
2840 1.1 dyoung
2841 1.1 dyoung /*
2842 1.1 dyoung ** Now setup MSI or MSI/X, should
2843 1.1 dyoung ** return us the number of supported
2844 1.1 dyoung ** vectors. (Will be 1 for MSI)
2845 1.1 dyoung */
2846 1.1 dyoung adapter->msix = ixgbe_setup_msix(adapter);
2847 1.1 dyoung return (0);
2848 1.1 dyoung }
2849 1.1 dyoung
2850 1.1 dyoung static void
2851 1.1 dyoung ixgbe_free_pci_resources(struct adapter * adapter)
2852 1.1 dyoung {
2853 1.1 dyoung #if defined(NETBSD_MSI_OR_MSIX)
2854 1.1 dyoung struct ix_queue *que = adapter->queues;
2855 1.14 chs device_t dev = adapter->dev;
2856 1.1 dyoung #endif
2857 1.9 skrll int rid;
2858 1.1 dyoung
2859 1.9 skrll #if defined(NETBSD_MSI_OR_MSIX)
2860 1.9 skrll int memrid;
2861 1.1 dyoung if (adapter->hw.mac.type == ixgbe_mac_82598EB)
2862 1.1 dyoung memrid = PCI_BAR(MSIX_82598_BAR);
2863 1.1 dyoung else
2864 1.1 dyoung memrid = PCI_BAR(MSIX_82599_BAR);
2865 1.1 dyoung
2866 1.1 dyoung /*
2867 1.1 dyoung ** There is a slight possibility of a failure mode
2868 1.1 dyoung ** in attach that will result in entering this function
2869 1.1 dyoung ** before interrupt resources have been initialized, and
2870 1.1 dyoung ** in that case we do not want to execute the loops below
2871 1.1 dyoung ** We can detect this reliably by the state of the adapter
2872 1.1 dyoung ** res pointer.
2873 1.1 dyoung */
2874 1.1 dyoung if (adapter->res == NULL)
2875 1.1 dyoung goto mem;
2876 1.1 dyoung
2877 1.1 dyoung /*
2878 1.1 dyoung ** Release all msix queue resources:
2879 1.1 dyoung */
2880 1.1 dyoung for (int i = 0; i < adapter->num_queues; i++, que++) {
2881 1.1 dyoung rid = que->msix + 1;
2882 1.1 dyoung if (que->tag != NULL) {
2883 1.1 dyoung bus_teardown_intr(dev, que->res, que->tag);
2884 1.1 dyoung que->tag = NULL;
2885 1.1 dyoung }
2886 1.1 dyoung if (que->res != NULL)
2887 1.1 dyoung bus_release_resource(dev, SYS_RES_IRQ, rid, que->res);
2888 1.1 dyoung }
2889 1.1 dyoung #endif
2890 1.1 dyoung
2891 1.1 dyoung /* Clean the Legacy or Link interrupt last */
2892 1.1 dyoung if (adapter->linkvec) /* we are doing MSIX */
2893 1.1 dyoung rid = adapter->linkvec + 1;
2894 1.1 dyoung else
2895 1.1 dyoung (adapter->msix != 0) ? (rid = 1):(rid = 0);
2896 1.1 dyoung
2897 1.14.2.6 snj if (adapter->osdep.intr != NULL)
2898 1.14.2.6 snj pci_intr_disestablish(adapter->osdep.pc, adapter->osdep.intr);
2899 1.1 dyoung adapter->osdep.intr = NULL;
2900 1.1 dyoung
2901 1.1 dyoung #if defined(NETBSD_MSI_OR_MSIX)
2902 1.1 dyoung mem:
2903 1.1 dyoung if (adapter->msix)
2904 1.1 dyoung pci_release_msi(dev);
2905 1.1 dyoung
2906 1.1 dyoung if (adapter->msix_mem != NULL)
2907 1.1 dyoung bus_release_resource(dev, SYS_RES_MEMORY,
2908 1.1 dyoung memrid, adapter->msix_mem);
2909 1.1 dyoung #endif
2910 1.1 dyoung
2911 1.1 dyoung if (adapter->osdep.mem_size != 0) {
2912 1.1 dyoung bus_space_unmap(adapter->osdep.mem_bus_space_tag,
2913 1.1 dyoung adapter->osdep.mem_bus_space_handle,
2914 1.1 dyoung adapter->osdep.mem_size);
2915 1.1 dyoung }
2916 1.1 dyoung
2917 1.1 dyoung return;
2918 1.1 dyoung }
2919 1.1 dyoung
2920 1.1 dyoung /*********************************************************************
2921 1.1 dyoung *
2922 1.1 dyoung * Setup networking device structure and register an interface.
2923 1.1 dyoung *
2924 1.1 dyoung **********************************************************************/
2925 1.1 dyoung static int
2926 1.1 dyoung ixgbe_setup_interface(device_t dev, struct adapter *adapter)
2927 1.1 dyoung {
2928 1.1 dyoung struct ethercom *ec = &adapter->osdep.ec;
2929 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
2930 1.1 dyoung struct ifnet *ifp;
2931 1.1 dyoung
2932 1.1 dyoung INIT_DEBUGOUT("ixgbe_setup_interface: begin");
2933 1.1 dyoung
2934 1.1 dyoung ifp = adapter->ifp = &ec->ec_if;
2935 1.1 dyoung strlcpy(ifp->if_xname, device_xname(dev), IFNAMSIZ);
2936 1.14.2.4 riz ifp->if_baudrate = IF_Gbps(10);
2937 1.1 dyoung ifp->if_init = ixgbe_init;
2938 1.1 dyoung ifp->if_stop = ixgbe_ifstop;
2939 1.1 dyoung ifp->if_softc = adapter;
2940 1.1 dyoung ifp->if_flags = IFF_BROADCAST | IFF_SIMPLEX | IFF_MULTICAST;
2941 1.1 dyoung ifp->if_ioctl = ixgbe_ioctl;
2942 1.14.2.5 riz #ifndef IXGBE_LEGACY_TX
2943 1.1 dyoung ifp->if_transmit = ixgbe_mq_start;
2944 1.1 dyoung ifp->if_qflush = ixgbe_qflush;
2945 1.14.2.4 riz #else
2946 1.14.2.4 riz ifp->if_start = ixgbe_start;
2947 1.14.2.4 riz IFQ_SET_MAXLEN(&ifp->if_snd, adapter->num_tx_desc - 2);
2948 1.14.2.6 snj #if 0
2949 1.14.2.6 snj ifp->if_snd.ifq_drv_maxlen = adapter->num_tx_desc - 2;
2950 1.14.2.6 snj #endif
2951 1.14.2.6 snj IFQ_SET_READY(&ifp->if_snd);
2952 1.1 dyoung #endif
2953 1.1 dyoung
2954 1.1 dyoung if_attach(ifp);
2955 1.1 dyoung ether_ifattach(ifp, adapter->hw.mac.addr);
2956 1.1 dyoung ether_set_ifflags_cb(ec, ixgbe_ifflags_cb);
2957 1.1 dyoung
2958 1.1 dyoung adapter->max_frame_size =
2959 1.1 dyoung ifp->if_mtu + ETHER_HDR_LEN + ETHER_CRC_LEN;
2960 1.1 dyoung
2961 1.1 dyoung /*
2962 1.1 dyoung * Tell the upper layer(s) we support long frames.
2963 1.1 dyoung */
2964 1.1 dyoung ifp->if_hdrlen = sizeof(struct ether_vlan_header);
2965 1.1 dyoung
2966 1.14.2.4 riz ifp->if_capabilities |= IFCAP_HWCSUM | IFCAP_TSOv4 | IFCAP_TSOv6;
2967 1.1 dyoung ifp->if_capenable = 0;
2968 1.1 dyoung
2969 1.1 dyoung ec->ec_capabilities |= ETHERCAP_VLAN_HWCSUM;
2970 1.1 dyoung ec->ec_capabilities |= ETHERCAP_JUMBO_MTU;
2971 1.14.2.4 riz ifp->if_capabilities |= IFCAP_LRO;
2972 1.14.2.3 martin ec->ec_capabilities |= ETHERCAP_VLAN_HWTAGGING
2973 1.14.2.3 martin | ETHERCAP_VLAN_MTU;
2974 1.1 dyoung ec->ec_capenable = ec->ec_capabilities;
2975 1.1 dyoung
2976 1.1 dyoung /*
2977 1.14.2.3 martin ** Don't turn this on by default, if vlans are
2978 1.1 dyoung ** created on another pseudo device (eg. lagg)
2979 1.1 dyoung ** then vlan events are not passed thru, breaking
2980 1.1 dyoung ** operation, but with HW FILTER off it works. If
2981 1.14.2.3 martin ** using vlans directly on the ixgbe driver you can
2982 1.1 dyoung ** enable this and get full hardware tag filtering.
2983 1.1 dyoung */
2984 1.1 dyoung ec->ec_capabilities |= ETHERCAP_VLAN_HWFILTER;
2985 1.1 dyoung
2986 1.1 dyoung /*
2987 1.1 dyoung * Specify the media types supported by this adapter and register
2988 1.1 dyoung * callbacks to update media and link information
2989 1.1 dyoung */
2990 1.1 dyoung ifmedia_init(&adapter->media, IFM_IMASK, ixgbe_media_change,
2991 1.1 dyoung ixgbe_media_status);
2992 1.1 dyoung ifmedia_add(&adapter->media, IFM_ETHER | adapter->optics, 0, NULL);
2993 1.1 dyoung ifmedia_set(&adapter->media, IFM_ETHER | adapter->optics);
2994 1.1 dyoung if (hw->device_id == IXGBE_DEV_ID_82598AT) {
2995 1.1 dyoung ifmedia_add(&adapter->media,
2996 1.1 dyoung IFM_ETHER | IFM_1000_T | IFM_FDX, 0, NULL);
2997 1.1 dyoung ifmedia_add(&adapter->media,
2998 1.1 dyoung IFM_ETHER | IFM_1000_T, 0, NULL);
2999 1.1 dyoung }
3000 1.1 dyoung ifmedia_add(&adapter->media, IFM_ETHER | IFM_AUTO, 0, NULL);
3001 1.1 dyoung ifmedia_set(&adapter->media, IFM_ETHER | IFM_AUTO);
3002 1.1 dyoung
3003 1.1 dyoung return (0);
3004 1.1 dyoung }
3005 1.1 dyoung
3006 1.1 dyoung static void
3007 1.1 dyoung ixgbe_config_link(struct adapter *adapter)
3008 1.1 dyoung {
3009 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
3010 1.1 dyoung u32 autoneg, err = 0;
3011 1.1 dyoung bool sfp, negotiate;
3012 1.1 dyoung
3013 1.1 dyoung sfp = ixgbe_is_sfp(hw);
3014 1.1 dyoung
3015 1.1 dyoung if (sfp) {
3016 1.14.2.2 martin void *ip;
3017 1.14.2.2 martin
3018 1.1 dyoung if (hw->phy.multispeed_fiber) {
3019 1.1 dyoung hw->mac.ops.setup_sfp(hw);
3020 1.1 dyoung ixgbe_enable_tx_laser(hw);
3021 1.14.2.2 martin ip = adapter->msf_si;
3022 1.1 dyoung } else {
3023 1.14.2.2 martin ip = adapter->mod_si;
3024 1.1 dyoung }
3025 1.14.2.2 martin
3026 1.14.2.2 martin kpreempt_disable();
3027 1.14.2.2 martin softint_schedule(ip);
3028 1.14.2.2 martin kpreempt_enable();
3029 1.1 dyoung } else {
3030 1.1 dyoung if (hw->mac.ops.check_link)
3031 1.14.2.5 riz err = ixgbe_check_link(hw, &adapter->link_speed,
3032 1.1 dyoung &adapter->link_up, FALSE);
3033 1.1 dyoung if (err)
3034 1.1 dyoung goto out;
3035 1.1 dyoung autoneg = hw->phy.autoneg_advertised;
3036 1.1 dyoung if ((!autoneg) && (hw->mac.ops.get_link_capabilities))
3037 1.1 dyoung err = hw->mac.ops.get_link_capabilities(hw,
3038 1.1 dyoung &autoneg, &negotiate);
3039 1.13 christos else
3040 1.13 christos negotiate = 0;
3041 1.1 dyoung if (err)
3042 1.1 dyoung goto out;
3043 1.1 dyoung if (hw->mac.ops.setup_link)
3044 1.14.2.5 riz err = hw->mac.ops.setup_link(hw,
3045 1.14.2.5 riz autoneg, adapter->link_up);
3046 1.1 dyoung }
3047 1.1 dyoung out:
3048 1.1 dyoung return;
3049 1.1 dyoung }
3050 1.1 dyoung
3051 1.1 dyoung /********************************************************************
3052 1.1 dyoung * Manage DMA'able memory.
3053 1.1 dyoung *******************************************************************/
3054 1.1 dyoung
3055 1.1 dyoung static int
3056 1.1 dyoung ixgbe_dma_malloc(struct adapter *adapter, const bus_size_t size,
3057 1.1 dyoung struct ixgbe_dma_alloc *dma, const int mapflags)
3058 1.1 dyoung {
3059 1.1 dyoung device_t dev = adapter->dev;
3060 1.1 dyoung int r, rsegs;
3061 1.1 dyoung
3062 1.1 dyoung r = ixgbe_dma_tag_create(adapter->osdep.dmat, /* parent */
3063 1.1 dyoung DBA_ALIGN, 0, /* alignment, bounds */
3064 1.1 dyoung size, /* maxsize */
3065 1.1 dyoung 1, /* nsegments */
3066 1.1 dyoung size, /* maxsegsize */
3067 1.1 dyoung BUS_DMA_ALLOCNOW, /* flags */
3068 1.1 dyoung &dma->dma_tag);
3069 1.1 dyoung if (r != 0) {
3070 1.1 dyoung aprint_error_dev(dev,
3071 1.1 dyoung "%s: ixgbe_dma_tag_create failed; error %d\n", __func__, r);
3072 1.1 dyoung goto fail_0;
3073 1.1 dyoung }
3074 1.1 dyoung
3075 1.1 dyoung r = bus_dmamem_alloc(dma->dma_tag->dt_dmat,
3076 1.1 dyoung size,
3077 1.1 dyoung dma->dma_tag->dt_alignment,
3078 1.1 dyoung dma->dma_tag->dt_boundary,
3079 1.1 dyoung &dma->dma_seg, 1, &rsegs, BUS_DMA_NOWAIT);
3080 1.1 dyoung if (r != 0) {
3081 1.1 dyoung aprint_error_dev(dev,
3082 1.1 dyoung "%s: bus_dmamem_alloc failed; error %d\n", __func__, r);
3083 1.1 dyoung goto fail_1;
3084 1.1 dyoung }
3085 1.1 dyoung
3086 1.1 dyoung r = bus_dmamem_map(dma->dma_tag->dt_dmat, &dma->dma_seg, rsegs,
3087 1.1 dyoung size, &dma->dma_vaddr, BUS_DMA_NOWAIT);
3088 1.1 dyoung if (r != 0) {
3089 1.1 dyoung aprint_error_dev(dev, "%s: bus_dmamem_map failed; error %d\n",
3090 1.1 dyoung __func__, r);
3091 1.1 dyoung goto fail_2;
3092 1.1 dyoung }
3093 1.1 dyoung
3094 1.1 dyoung r = ixgbe_dmamap_create(dma->dma_tag, 0, &dma->dma_map);
3095 1.1 dyoung if (r != 0) {
3096 1.1 dyoung aprint_error_dev(dev, "%s: bus_dmamem_map failed; error %d\n",
3097 1.1 dyoung __func__, r);
3098 1.1 dyoung goto fail_3;
3099 1.1 dyoung }
3100 1.1 dyoung
3101 1.1 dyoung r = bus_dmamap_load(dma->dma_tag->dt_dmat, dma->dma_map, dma->dma_vaddr,
3102 1.1 dyoung size,
3103 1.1 dyoung NULL,
3104 1.1 dyoung mapflags | BUS_DMA_NOWAIT);
3105 1.1 dyoung if (r != 0) {
3106 1.1 dyoung aprint_error_dev(dev, "%s: bus_dmamap_load failed; error %d\n",
3107 1.1 dyoung __func__, r);
3108 1.1 dyoung goto fail_4;
3109 1.1 dyoung }
3110 1.1 dyoung dma->dma_paddr = dma->dma_map->dm_segs[0].ds_addr;
3111 1.1 dyoung dma->dma_size = size;
3112 1.1 dyoung return 0;
3113 1.1 dyoung fail_4:
3114 1.1 dyoung ixgbe_dmamap_destroy(dma->dma_tag, dma->dma_map);
3115 1.1 dyoung fail_3:
3116 1.1 dyoung bus_dmamem_unmap(dma->dma_tag->dt_dmat, dma->dma_vaddr, size);
3117 1.1 dyoung fail_2:
3118 1.1 dyoung bus_dmamem_free(dma->dma_tag->dt_dmat, &dma->dma_seg, rsegs);
3119 1.1 dyoung fail_1:
3120 1.1 dyoung ixgbe_dma_tag_destroy(dma->dma_tag);
3121 1.1 dyoung fail_0:
3122 1.1 dyoung return r;
3123 1.1 dyoung }
3124 1.1 dyoung
3125 1.1 dyoung static void
3126 1.1 dyoung ixgbe_dma_free(struct adapter *adapter, struct ixgbe_dma_alloc *dma)
3127 1.1 dyoung {
3128 1.1 dyoung bus_dmamap_sync(dma->dma_tag->dt_dmat, dma->dma_map, 0, dma->dma_size,
3129 1.1 dyoung BUS_DMASYNC_POSTREAD | BUS_DMASYNC_POSTWRITE);
3130 1.1 dyoung ixgbe_dmamap_unload(dma->dma_tag, dma->dma_map);
3131 1.1 dyoung bus_dmamem_free(dma->dma_tag->dt_dmat, &dma->dma_seg, 1);
3132 1.1 dyoung ixgbe_dma_tag_destroy(dma->dma_tag);
3133 1.1 dyoung }
3134 1.1 dyoung
3135 1.1 dyoung
3136 1.1 dyoung /*********************************************************************
3137 1.1 dyoung *
3138 1.1 dyoung * Allocate memory for the transmit and receive rings, and then
3139 1.1 dyoung * the descriptors associated with each, called only once at attach.
3140 1.1 dyoung *
3141 1.1 dyoung **********************************************************************/
3142 1.1 dyoung static int
3143 1.1 dyoung ixgbe_allocate_queues(struct adapter *adapter)
3144 1.1 dyoung {
3145 1.1 dyoung device_t dev = adapter->dev;
3146 1.1 dyoung struct ix_queue *que;
3147 1.1 dyoung struct tx_ring *txr;
3148 1.1 dyoung struct rx_ring *rxr;
3149 1.1 dyoung int rsize, tsize, error = IXGBE_SUCCESS;
3150 1.1 dyoung int txconf = 0, rxconf = 0;
3151 1.1 dyoung
3152 1.1 dyoung /* First allocate the top level queue structs */
3153 1.1 dyoung if (!(adapter->queues =
3154 1.1 dyoung (struct ix_queue *) malloc(sizeof(struct ix_queue) *
3155 1.1 dyoung adapter->num_queues, M_DEVBUF, M_NOWAIT | M_ZERO))) {
3156 1.1 dyoung aprint_error_dev(dev, "Unable to allocate queue memory\n");
3157 1.1 dyoung error = ENOMEM;
3158 1.1 dyoung goto fail;
3159 1.1 dyoung }
3160 1.1 dyoung
3161 1.1 dyoung /* First allocate the TX ring struct memory */
3162 1.1 dyoung if (!(adapter->tx_rings =
3163 1.1 dyoung (struct tx_ring *) malloc(sizeof(struct tx_ring) *
3164 1.1 dyoung adapter->num_queues, M_DEVBUF, M_NOWAIT | M_ZERO))) {
3165 1.1 dyoung aprint_error_dev(dev, "Unable to allocate TX ring memory\n");
3166 1.1 dyoung error = ENOMEM;
3167 1.1 dyoung goto tx_fail;
3168 1.1 dyoung }
3169 1.1 dyoung
3170 1.1 dyoung /* Next allocate the RX */
3171 1.1 dyoung if (!(adapter->rx_rings =
3172 1.1 dyoung (struct rx_ring *) malloc(sizeof(struct rx_ring) *
3173 1.1 dyoung adapter->num_queues, M_DEVBUF, M_NOWAIT | M_ZERO))) {
3174 1.1 dyoung aprint_error_dev(dev, "Unable to allocate RX ring memory\n");
3175 1.1 dyoung error = ENOMEM;
3176 1.1 dyoung goto rx_fail;
3177 1.1 dyoung }
3178 1.1 dyoung
3179 1.1 dyoung /* For the ring itself */
3180 1.1 dyoung tsize = roundup2(adapter->num_tx_desc *
3181 1.1 dyoung sizeof(union ixgbe_adv_tx_desc), DBA_ALIGN);
3182 1.1 dyoung
3183 1.1 dyoung /*
3184 1.1 dyoung * Now set up the TX queues, txconf is needed to handle the
3185 1.1 dyoung * possibility that things fail midcourse and we need to
3186 1.1 dyoung * undo memory gracefully
3187 1.1 dyoung */
3188 1.1 dyoung for (int i = 0; i < adapter->num_queues; i++, txconf++) {
3189 1.1 dyoung /* Set up some basics */
3190 1.1 dyoung txr = &adapter->tx_rings[i];
3191 1.1 dyoung txr->adapter = adapter;
3192 1.1 dyoung txr->me = i;
3193 1.14.2.5 riz txr->num_desc = adapter->num_tx_desc;
3194 1.1 dyoung
3195 1.1 dyoung /* Initialize the TX side lock */
3196 1.1 dyoung snprintf(txr->mtx_name, sizeof(txr->mtx_name), "%s:tx(%d)",
3197 1.1 dyoung device_xname(dev), txr->me);
3198 1.1 dyoung mutex_init(&txr->tx_mtx, MUTEX_DEFAULT, IPL_NET);
3199 1.1 dyoung
3200 1.1 dyoung if (ixgbe_dma_malloc(adapter, tsize,
3201 1.1 dyoung &txr->txdma, BUS_DMA_NOWAIT)) {
3202 1.1 dyoung aprint_error_dev(dev,
3203 1.1 dyoung "Unable to allocate TX Descriptor memory\n");
3204 1.1 dyoung error = ENOMEM;
3205 1.1 dyoung goto err_tx_desc;
3206 1.1 dyoung }
3207 1.1 dyoung txr->tx_base = (union ixgbe_adv_tx_desc *)txr->txdma.dma_vaddr;
3208 1.1 dyoung bzero((void *)txr->tx_base, tsize);
3209 1.1 dyoung
3210 1.1 dyoung /* Now allocate transmit buffers for the ring */
3211 1.1 dyoung if (ixgbe_allocate_transmit_buffers(txr)) {
3212 1.1 dyoung aprint_error_dev(dev,
3213 1.1 dyoung "Critical Failure setting up transmit buffers\n");
3214 1.1 dyoung error = ENOMEM;
3215 1.1 dyoung goto err_tx_desc;
3216 1.1 dyoung }
3217 1.14.2.5 riz #ifndef IXGBE_LEGACY_TX
3218 1.1 dyoung /* Allocate a buf ring */
3219 1.1 dyoung txr->br = buf_ring_alloc(IXGBE_BR_SIZE, M_DEVBUF,
3220 1.1 dyoung M_WAITOK, &txr->tx_mtx);
3221 1.1 dyoung if (txr->br == NULL) {
3222 1.1 dyoung aprint_error_dev(dev,
3223 1.1 dyoung "Critical Failure setting up buf ring\n");
3224 1.1 dyoung error = ENOMEM;
3225 1.1 dyoung goto err_tx_desc;
3226 1.1 dyoung }
3227 1.1 dyoung #endif
3228 1.1 dyoung }
3229 1.1 dyoung
3230 1.1 dyoung /*
3231 1.1 dyoung * Next the RX queues...
3232 1.1 dyoung */
3233 1.1 dyoung rsize = roundup2(adapter->num_rx_desc *
3234 1.1 dyoung sizeof(union ixgbe_adv_rx_desc), DBA_ALIGN);
3235 1.1 dyoung for (int i = 0; i < adapter->num_queues; i++, rxconf++) {
3236 1.1 dyoung rxr = &adapter->rx_rings[i];
3237 1.1 dyoung /* Set up some basics */
3238 1.1 dyoung rxr->adapter = adapter;
3239 1.1 dyoung rxr->me = i;
3240 1.14.2.5 riz rxr->num_desc = adapter->num_rx_desc;
3241 1.1 dyoung
3242 1.1 dyoung /* Initialize the RX side lock */
3243 1.1 dyoung snprintf(rxr->mtx_name, sizeof(rxr->mtx_name), "%s:rx(%d)",
3244 1.1 dyoung device_xname(dev), rxr->me);
3245 1.1 dyoung mutex_init(&rxr->rx_mtx, MUTEX_DEFAULT, IPL_NET);
3246 1.1 dyoung
3247 1.1 dyoung if (ixgbe_dma_malloc(adapter, rsize,
3248 1.1 dyoung &rxr->rxdma, BUS_DMA_NOWAIT)) {
3249 1.1 dyoung aprint_error_dev(dev,
3250 1.1 dyoung "Unable to allocate RxDescriptor memory\n");
3251 1.1 dyoung error = ENOMEM;
3252 1.1 dyoung goto err_rx_desc;
3253 1.1 dyoung }
3254 1.1 dyoung rxr->rx_base = (union ixgbe_adv_rx_desc *)rxr->rxdma.dma_vaddr;
3255 1.1 dyoung bzero((void *)rxr->rx_base, rsize);
3256 1.1 dyoung
3257 1.1 dyoung /* Allocate receive buffers for the ring*/
3258 1.1 dyoung if (ixgbe_allocate_receive_buffers(rxr)) {
3259 1.1 dyoung aprint_error_dev(dev,
3260 1.1 dyoung "Critical Failure setting up receive buffers\n");
3261 1.1 dyoung error = ENOMEM;
3262 1.1 dyoung goto err_rx_desc;
3263 1.1 dyoung }
3264 1.1 dyoung }
3265 1.1 dyoung
3266 1.1 dyoung /*
3267 1.1 dyoung ** Finally set up the queue holding structs
3268 1.1 dyoung */
3269 1.1 dyoung for (int i = 0; i < adapter->num_queues; i++) {
3270 1.1 dyoung que = &adapter->queues[i];
3271 1.1 dyoung que->adapter = adapter;
3272 1.1 dyoung que->txr = &adapter->tx_rings[i];
3273 1.1 dyoung que->rxr = &adapter->rx_rings[i];
3274 1.1 dyoung }
3275 1.1 dyoung
3276 1.1 dyoung return (0);
3277 1.1 dyoung
3278 1.1 dyoung err_rx_desc:
3279 1.1 dyoung for (rxr = adapter->rx_rings; rxconf > 0; rxr++, rxconf--)
3280 1.1 dyoung ixgbe_dma_free(adapter, &rxr->rxdma);
3281 1.1 dyoung err_tx_desc:
3282 1.1 dyoung for (txr = adapter->tx_rings; txconf > 0; txr++, txconf--)
3283 1.1 dyoung ixgbe_dma_free(adapter, &txr->txdma);
3284 1.1 dyoung free(adapter->rx_rings, M_DEVBUF);
3285 1.1 dyoung rx_fail:
3286 1.1 dyoung free(adapter->tx_rings, M_DEVBUF);
3287 1.1 dyoung tx_fail:
3288 1.1 dyoung free(adapter->queues, M_DEVBUF);
3289 1.1 dyoung fail:
3290 1.1 dyoung return (error);
3291 1.1 dyoung }
3292 1.1 dyoung
3293 1.1 dyoung /*********************************************************************
3294 1.1 dyoung *
3295 1.1 dyoung * Allocate memory for tx_buffer structures. The tx_buffer stores all
3296 1.1 dyoung * the information needed to transmit a packet on the wire. This is
3297 1.1 dyoung * called only once at attach, setup is done every reset.
3298 1.1 dyoung *
3299 1.1 dyoung **********************************************************************/
3300 1.1 dyoung static int
3301 1.1 dyoung ixgbe_allocate_transmit_buffers(struct tx_ring *txr)
3302 1.1 dyoung {
3303 1.1 dyoung struct adapter *adapter = txr->adapter;
3304 1.1 dyoung device_t dev = adapter->dev;
3305 1.1 dyoung struct ixgbe_tx_buf *txbuf;
3306 1.1 dyoung int error, i;
3307 1.1 dyoung
3308 1.1 dyoung /*
3309 1.1 dyoung * Setup DMA descriptor areas.
3310 1.1 dyoung */
3311 1.1 dyoung if ((error = ixgbe_dma_tag_create(adapter->osdep.dmat, /* parent */
3312 1.1 dyoung 1, 0, /* alignment, bounds */
3313 1.1 dyoung IXGBE_TSO_SIZE, /* maxsize */
3314 1.1 dyoung adapter->num_segs, /* nsegments */
3315 1.1 dyoung PAGE_SIZE, /* maxsegsize */
3316 1.1 dyoung 0, /* flags */
3317 1.1 dyoung &txr->txtag))) {
3318 1.1 dyoung aprint_error_dev(dev,"Unable to allocate TX DMA tag\n");
3319 1.1 dyoung goto fail;
3320 1.1 dyoung }
3321 1.1 dyoung
3322 1.1 dyoung if (!(txr->tx_buffers =
3323 1.1 dyoung (struct ixgbe_tx_buf *) malloc(sizeof(struct ixgbe_tx_buf) *
3324 1.1 dyoung adapter->num_tx_desc, M_DEVBUF, M_NOWAIT | M_ZERO))) {
3325 1.1 dyoung aprint_error_dev(dev, "Unable to allocate tx_buffer memory\n");
3326 1.1 dyoung error = ENOMEM;
3327 1.1 dyoung goto fail;
3328 1.1 dyoung }
3329 1.1 dyoung
3330 1.1 dyoung /* Create the descriptor buffer dma maps */
3331 1.1 dyoung txbuf = txr->tx_buffers;
3332 1.1 dyoung for (i = 0; i < adapter->num_tx_desc; i++, txbuf++) {
3333 1.1 dyoung error = ixgbe_dmamap_create(txr->txtag, 0, &txbuf->map);
3334 1.1 dyoung if (error != 0) {
3335 1.14.2.4 riz aprint_error_dev(dev,
3336 1.14.2.4 riz "Unable to create TX DMA map (%d)\n", error);
3337 1.1 dyoung goto fail;
3338 1.1 dyoung }
3339 1.1 dyoung }
3340 1.1 dyoung
3341 1.1 dyoung return 0;
3342 1.1 dyoung fail:
3343 1.1 dyoung /* We free all, it handles case where we are in the middle */
3344 1.1 dyoung ixgbe_free_transmit_structures(adapter);
3345 1.1 dyoung return (error);
3346 1.1 dyoung }
3347 1.1 dyoung
3348 1.1 dyoung /*********************************************************************
3349 1.1 dyoung *
3350 1.1 dyoung * Initialize a transmit ring.
3351 1.1 dyoung *
3352 1.1 dyoung **********************************************************************/
3353 1.1 dyoung static void
3354 1.1 dyoung ixgbe_setup_transmit_ring(struct tx_ring *txr)
3355 1.1 dyoung {
3356 1.1 dyoung struct adapter *adapter = txr->adapter;
3357 1.1 dyoung struct ixgbe_tx_buf *txbuf;
3358 1.1 dyoung int i;
3359 1.14.2.3 martin #ifdef DEV_NETMAP
3360 1.14.2.3 martin struct netmap_adapter *na = NA(adapter->ifp);
3361 1.14.2.3 martin struct netmap_slot *slot;
3362 1.14.2.3 martin #endif /* DEV_NETMAP */
3363 1.1 dyoung
3364 1.1 dyoung /* Clear the old ring contents */
3365 1.1 dyoung IXGBE_TX_LOCK(txr);
3366 1.14.2.3 martin #ifdef DEV_NETMAP
3367 1.14.2.3 martin /*
3368 1.14.2.3 martin * (under lock): if in netmap mode, do some consistency
3369 1.14.2.3 martin * checks and set slot to entry 0 of the netmap ring.
3370 1.14.2.3 martin */
3371 1.14.2.3 martin slot = netmap_reset(na, NR_TX, txr->me, 0);
3372 1.14.2.3 martin #endif /* DEV_NETMAP */
3373 1.1 dyoung bzero((void *)txr->tx_base,
3374 1.1 dyoung (sizeof(union ixgbe_adv_tx_desc)) * adapter->num_tx_desc);
3375 1.1 dyoung /* Reset indices */
3376 1.1 dyoung txr->next_avail_desc = 0;
3377 1.1 dyoung txr->next_to_clean = 0;
3378 1.1 dyoung
3379 1.1 dyoung /* Free any existing tx buffers. */
3380 1.1 dyoung txbuf = txr->tx_buffers;
3381 1.14.2.5 riz for (i = 0; i < txr->num_desc; i++, txbuf++) {
3382 1.1 dyoung if (txbuf->m_head != NULL) {
3383 1.1 dyoung bus_dmamap_sync(txr->txtag->dt_dmat, txbuf->map,
3384 1.1 dyoung 0, txbuf->m_head->m_pkthdr.len,
3385 1.1 dyoung BUS_DMASYNC_POSTWRITE);
3386 1.1 dyoung ixgbe_dmamap_unload(txr->txtag, txbuf->map);
3387 1.1 dyoung m_freem(txbuf->m_head);
3388 1.1 dyoung txbuf->m_head = NULL;
3389 1.1 dyoung }
3390 1.14.2.3 martin #ifdef DEV_NETMAP
3391 1.14.2.3 martin /*
3392 1.14.2.3 martin * In netmap mode, set the map for the packet buffer.
3393 1.14.2.3 martin * NOTE: Some drivers (not this one) also need to set
3394 1.14.2.3 martin * the physical buffer address in the NIC ring.
3395 1.14.2.3 martin * Slots in the netmap ring (indexed by "si") are
3396 1.14.2.3 martin * kring->nkr_hwofs positions "ahead" wrt the
3397 1.14.2.3 martin * corresponding slot in the NIC ring. In some drivers
3398 1.14.2.4 riz * (not here) nkr_hwofs can be negative. Function
3399 1.14.2.4 riz * netmap_idx_n2k() handles wraparounds properly.
3400 1.14.2.3 martin */
3401 1.14.2.3 martin if (slot) {
3402 1.14.2.4 riz int si = netmap_idx_n2k(&na->tx_rings[txr->me], i);
3403 1.14.2.6 snj netmap_load_map(na, txr->txtag, txbuf->map, NMB(na, slot + si));
3404 1.14.2.3 martin }
3405 1.14.2.3 martin #endif /* DEV_NETMAP */
3406 1.14.2.5 riz /* Clear the EOP descriptor pointer */
3407 1.14.2.5 riz txbuf->eop = NULL;
3408 1.1 dyoung }
3409 1.1 dyoung
3410 1.1 dyoung #ifdef IXGBE_FDIR
3411 1.1 dyoung /* Set the rate at which we sample packets */
3412 1.1 dyoung if (adapter->hw.mac.type != ixgbe_mac_82598EB)
3413 1.1 dyoung txr->atr_sample = atr_sample_rate;
3414 1.1 dyoung #endif
3415 1.1 dyoung
3416 1.1 dyoung /* Set number of descriptors available */
3417 1.1 dyoung txr->tx_avail = adapter->num_tx_desc;
3418 1.1 dyoung
3419 1.1 dyoung ixgbe_dmamap_sync(txr->txdma.dma_tag, txr->txdma.dma_map,
3420 1.1 dyoung BUS_DMASYNC_PREREAD | BUS_DMASYNC_PREWRITE);
3421 1.1 dyoung IXGBE_TX_UNLOCK(txr);
3422 1.1 dyoung }
3423 1.1 dyoung
3424 1.1 dyoung /*********************************************************************
3425 1.1 dyoung *
3426 1.1 dyoung * Initialize all transmit rings.
3427 1.1 dyoung *
3428 1.1 dyoung **********************************************************************/
3429 1.1 dyoung static int
3430 1.1 dyoung ixgbe_setup_transmit_structures(struct adapter *adapter)
3431 1.1 dyoung {
3432 1.1 dyoung struct tx_ring *txr = adapter->tx_rings;
3433 1.1 dyoung
3434 1.1 dyoung for (int i = 0; i < adapter->num_queues; i++, txr++)
3435 1.1 dyoung ixgbe_setup_transmit_ring(txr);
3436 1.1 dyoung
3437 1.1 dyoung return (0);
3438 1.1 dyoung }
3439 1.1 dyoung
3440 1.1 dyoung /*********************************************************************
3441 1.1 dyoung *
3442 1.1 dyoung * Enable transmit unit.
3443 1.1 dyoung *
3444 1.1 dyoung **********************************************************************/
3445 1.1 dyoung static void
3446 1.1 dyoung ixgbe_initialize_transmit_units(struct adapter *adapter)
3447 1.1 dyoung {
3448 1.1 dyoung struct tx_ring *txr = adapter->tx_rings;
3449 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
3450 1.1 dyoung
3451 1.1 dyoung /* Setup the Base and Length of the Tx Descriptor Ring */
3452 1.1 dyoung
3453 1.1 dyoung for (int i = 0; i < adapter->num_queues; i++, txr++) {
3454 1.1 dyoung u64 tdba = txr->txdma.dma_paddr;
3455 1.1 dyoung u32 txctrl;
3456 1.1 dyoung
3457 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_TDBAL(i),
3458 1.1 dyoung (tdba & 0x00000000ffffffffULL));
3459 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_TDBAH(i), (tdba >> 32));
3460 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_TDLEN(i),
3461 1.14.2.5 riz adapter->num_tx_desc * sizeof(union ixgbe_adv_tx_desc));
3462 1.1 dyoung
3463 1.1 dyoung /* Setup the HW Tx Head and Tail descriptor pointers */
3464 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_TDH(i), 0);
3465 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_TDT(i), 0);
3466 1.1 dyoung
3467 1.1 dyoung /* Setup Transmit Descriptor Cmd Settings */
3468 1.1 dyoung txr->txd_cmd = IXGBE_TXD_CMD_IFCS;
3469 1.1 dyoung txr->queue_status = IXGBE_QUEUE_IDLE;
3470 1.1 dyoung
3471 1.14.2.5 riz /* Set the processing limit */
3472 1.14.2.5 riz txr->process_limit = ixgbe_tx_process_limit;
3473 1.14.2.5 riz
3474 1.1 dyoung /* Disable Head Writeback */
3475 1.1 dyoung switch (hw->mac.type) {
3476 1.1 dyoung case ixgbe_mac_82598EB:
3477 1.1 dyoung txctrl = IXGBE_READ_REG(hw, IXGBE_DCA_TXCTRL(i));
3478 1.1 dyoung break;
3479 1.1 dyoung case ixgbe_mac_82599EB:
3480 1.14.2.4 riz case ixgbe_mac_X540:
3481 1.1 dyoung default:
3482 1.1 dyoung txctrl = IXGBE_READ_REG(hw, IXGBE_DCA_TXCTRL_82599(i));
3483 1.1 dyoung break;
3484 1.1 dyoung }
3485 1.14.2.4 riz txctrl &= ~IXGBE_DCA_TXCTRL_DESC_WRO_EN;
3486 1.1 dyoung switch (hw->mac.type) {
3487 1.1 dyoung case ixgbe_mac_82598EB:
3488 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_DCA_TXCTRL(i), txctrl);
3489 1.1 dyoung break;
3490 1.1 dyoung case ixgbe_mac_82599EB:
3491 1.14.2.4 riz case ixgbe_mac_X540:
3492 1.1 dyoung default:
3493 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_DCA_TXCTRL_82599(i), txctrl);
3494 1.1 dyoung break;
3495 1.1 dyoung }
3496 1.1 dyoung
3497 1.1 dyoung }
3498 1.1 dyoung
3499 1.1 dyoung if (hw->mac.type != ixgbe_mac_82598EB) {
3500 1.1 dyoung u32 dmatxctl, rttdcs;
3501 1.1 dyoung dmatxctl = IXGBE_READ_REG(hw, IXGBE_DMATXCTL);
3502 1.1 dyoung dmatxctl |= IXGBE_DMATXCTL_TE;
3503 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_DMATXCTL, dmatxctl);
3504 1.1 dyoung /* Disable arbiter to set MTQC */
3505 1.1 dyoung rttdcs = IXGBE_READ_REG(hw, IXGBE_RTTDCS);
3506 1.1 dyoung rttdcs |= IXGBE_RTTDCS_ARBDIS;
3507 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_RTTDCS, rttdcs);
3508 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_MTQC, IXGBE_MTQC_64Q_1PB);
3509 1.1 dyoung rttdcs &= ~IXGBE_RTTDCS_ARBDIS;
3510 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_RTTDCS, rttdcs);
3511 1.1 dyoung }
3512 1.1 dyoung
3513 1.1 dyoung return;
3514 1.1 dyoung }
3515 1.1 dyoung
3516 1.1 dyoung /*********************************************************************
3517 1.1 dyoung *
3518 1.1 dyoung * Free all transmit rings.
3519 1.1 dyoung *
3520 1.1 dyoung **********************************************************************/
3521 1.1 dyoung static void
3522 1.1 dyoung ixgbe_free_transmit_structures(struct adapter *adapter)
3523 1.1 dyoung {
3524 1.1 dyoung struct tx_ring *txr = adapter->tx_rings;
3525 1.1 dyoung
3526 1.1 dyoung for (int i = 0; i < adapter->num_queues; i++, txr++) {
3527 1.1 dyoung ixgbe_free_transmit_buffers(txr);
3528 1.1 dyoung ixgbe_dma_free(adapter, &txr->txdma);
3529 1.1 dyoung IXGBE_TX_LOCK_DESTROY(txr);
3530 1.1 dyoung }
3531 1.1 dyoung free(adapter->tx_rings, M_DEVBUF);
3532 1.1 dyoung }
3533 1.1 dyoung
3534 1.1 dyoung /*********************************************************************
3535 1.1 dyoung *
3536 1.1 dyoung * Free transmit ring related data structures.
3537 1.1 dyoung *
3538 1.1 dyoung **********************************************************************/
3539 1.1 dyoung static void
3540 1.1 dyoung ixgbe_free_transmit_buffers(struct tx_ring *txr)
3541 1.1 dyoung {
3542 1.1 dyoung struct adapter *adapter = txr->adapter;
3543 1.1 dyoung struct ixgbe_tx_buf *tx_buffer;
3544 1.1 dyoung int i;
3545 1.1 dyoung
3546 1.14.2.6 snj INIT_DEBUGOUT("ixgbe_free_transmit_ring: begin");
3547 1.1 dyoung
3548 1.1 dyoung if (txr->tx_buffers == NULL)
3549 1.1 dyoung return;
3550 1.1 dyoung
3551 1.1 dyoung tx_buffer = txr->tx_buffers;
3552 1.1 dyoung for (i = 0; i < adapter->num_tx_desc; i++, tx_buffer++) {
3553 1.1 dyoung if (tx_buffer->m_head != NULL) {
3554 1.1 dyoung bus_dmamap_sync(txr->txtag->dt_dmat, tx_buffer->map,
3555 1.1 dyoung 0, tx_buffer->m_head->m_pkthdr.len,
3556 1.1 dyoung BUS_DMASYNC_POSTWRITE);
3557 1.1 dyoung ixgbe_dmamap_unload(txr->txtag, tx_buffer->map);
3558 1.1 dyoung m_freem(tx_buffer->m_head);
3559 1.1 dyoung tx_buffer->m_head = NULL;
3560 1.1 dyoung if (tx_buffer->map != NULL) {
3561 1.1 dyoung ixgbe_dmamap_destroy(txr->txtag,
3562 1.1 dyoung tx_buffer->map);
3563 1.1 dyoung tx_buffer->map = NULL;
3564 1.1 dyoung }
3565 1.1 dyoung } else if (tx_buffer->map != NULL) {
3566 1.1 dyoung ixgbe_dmamap_unload(txr->txtag, tx_buffer->map);
3567 1.1 dyoung ixgbe_dmamap_destroy(txr->txtag, tx_buffer->map);
3568 1.1 dyoung tx_buffer->map = NULL;
3569 1.1 dyoung }
3570 1.1 dyoung }
3571 1.14.2.5 riz #ifndef IXGBE_LEGACY_TX
3572 1.1 dyoung if (txr->br != NULL)
3573 1.1 dyoung buf_ring_free(txr->br, M_DEVBUF);
3574 1.1 dyoung #endif
3575 1.1 dyoung if (txr->tx_buffers != NULL) {
3576 1.1 dyoung free(txr->tx_buffers, M_DEVBUF);
3577 1.1 dyoung txr->tx_buffers = NULL;
3578 1.1 dyoung }
3579 1.1 dyoung if (txr->txtag != NULL) {
3580 1.1 dyoung ixgbe_dma_tag_destroy(txr->txtag);
3581 1.1 dyoung txr->txtag = NULL;
3582 1.1 dyoung }
3583 1.1 dyoung return;
3584 1.1 dyoung }
3585 1.1 dyoung
3586 1.1 dyoung /*********************************************************************
3587 1.1 dyoung *
3588 1.14.2.5 riz * Advanced Context Descriptor setup for VLAN, CSUM or TSO
3589 1.1 dyoung *
3590 1.1 dyoung **********************************************************************/
3591 1.1 dyoung
3592 1.14.2.5 riz static int
3593 1.14.2.5 riz ixgbe_tx_ctx_setup(struct tx_ring *txr, struct mbuf *mp,
3594 1.14.2.5 riz u32 *cmd_type_len, u32 *olinfo_status)
3595 1.1 dyoung {
3596 1.1 dyoung struct m_tag *mtag;
3597 1.1 dyoung struct adapter *adapter = txr->adapter;
3598 1.1 dyoung struct ethercom *ec = &adapter->osdep.ec;
3599 1.1 dyoung struct ixgbe_adv_tx_context_desc *TXD;
3600 1.1 dyoung struct ether_vlan_header *eh;
3601 1.1 dyoung struct ip ip;
3602 1.1 dyoung struct ip6_hdr ip6;
3603 1.14.2.5 riz u32 vlan_macip_lens = 0, type_tucmd_mlhl = 0;
3604 1.14.2.5 riz int ehdrlen, ip_hlen = 0;
3605 1.1 dyoung u16 etype;
3606 1.12 hannken u8 ipproto __diagused = 0;
3607 1.14.2.5 riz int offload = TRUE;
3608 1.14.2.5 riz int ctxd = txr->next_avail_desc;
3609 1.14.2.5 riz u16 vtag = 0;
3610 1.14.2.5 riz
3611 1.14.2.5 riz /* First check if TSO is to be used */
3612 1.14.2.5 riz if (mp->m_pkthdr.csum_flags & (M_CSUM_TSOv4|M_CSUM_TSOv6))
3613 1.14.2.5 riz return (ixgbe_tso_setup(txr, mp, cmd_type_len, olinfo_status));
3614 1.1 dyoung
3615 1.14.2.5 riz if ((mp->m_pkthdr.csum_flags & M_CSUM_OFFLOAD) == 0)
3616 1.14.2.5 riz offload = FALSE;
3617 1.1 dyoung
3618 1.14.2.5 riz /* Indicate the whole packet as payload when not doing TSO */
3619 1.14.2.5 riz *olinfo_status |= mp->m_pkthdr.len << IXGBE_ADVTXD_PAYLEN_SHIFT;
3620 1.14.2.5 riz
3621 1.14.2.5 riz /* Now ready a context descriptor */
3622 1.1 dyoung TXD = (struct ixgbe_adv_tx_context_desc *) &txr->tx_base[ctxd];
3623 1.1 dyoung
3624 1.1 dyoung /*
3625 1.1 dyoung ** In advanced descriptors the vlan tag must
3626 1.14.2.5 riz ** be placed into the context descriptor. Hence
3627 1.14.2.5 riz ** we need to make one even if not doing offloads.
3628 1.1 dyoung */
3629 1.1 dyoung if ((mtag = VLAN_OUTPUT_TAG(ec, mp)) != NULL) {
3630 1.1 dyoung vtag = htole16(VLAN_TAG_VALUE(mtag) & 0xffff);
3631 1.1 dyoung vlan_macip_lens |= (vtag << IXGBE_ADVTXD_VLAN_SHIFT);
3632 1.14.2.5 riz } else if (offload == FALSE) /* ... no offload to do */
3633 1.1 dyoung return 0;
3634 1.1 dyoung
3635 1.1 dyoung /*
3636 1.1 dyoung * Determine where frame payload starts.
3637 1.1 dyoung * Jump over vlan headers if already present,
3638 1.1 dyoung * helpful for QinQ too.
3639 1.1 dyoung */
3640 1.1 dyoung KASSERT(mp->m_len >= offsetof(struct ether_vlan_header, evl_tag));
3641 1.1 dyoung eh = mtod(mp, struct ether_vlan_header *);
3642 1.1 dyoung if (eh->evl_encap_proto == htons(ETHERTYPE_VLAN)) {
3643 1.1 dyoung KASSERT(mp->m_len >= sizeof(struct ether_vlan_header));
3644 1.1 dyoung etype = ntohs(eh->evl_proto);
3645 1.1 dyoung ehdrlen = ETHER_HDR_LEN + ETHER_VLAN_ENCAP_LEN;
3646 1.1 dyoung } else {
3647 1.1 dyoung etype = ntohs(eh->evl_encap_proto);
3648 1.1 dyoung ehdrlen = ETHER_HDR_LEN;
3649 1.1 dyoung }
3650 1.1 dyoung
3651 1.1 dyoung /* Set the ether header length */
3652 1.1 dyoung vlan_macip_lens |= ehdrlen << IXGBE_ADVTXD_MACLEN_SHIFT;
3653 1.1 dyoung
3654 1.1 dyoung switch (etype) {
3655 1.1 dyoung case ETHERTYPE_IP:
3656 1.1 dyoung m_copydata(mp, ehdrlen, sizeof(ip), &ip);
3657 1.1 dyoung ip_hlen = ip.ip_hl << 2;
3658 1.1 dyoung ipproto = ip.ip_p;
3659 1.1 dyoung #if 0
3660 1.1 dyoung ip.ip_sum = 0;
3661 1.1 dyoung m_copyback(mp, ehdrlen, sizeof(ip), &ip);
3662 1.1 dyoung #else
3663 1.1 dyoung KASSERT((mp->m_pkthdr.csum_flags & M_CSUM_IPv4) == 0 ||
3664 1.1 dyoung ip.ip_sum == 0);
3665 1.1 dyoung #endif
3666 1.1 dyoung type_tucmd_mlhl |= IXGBE_ADVTXD_TUCMD_IPV4;
3667 1.1 dyoung break;
3668 1.1 dyoung case ETHERTYPE_IPV6:
3669 1.1 dyoung m_copydata(mp, ehdrlen, sizeof(ip6), &ip6);
3670 1.1 dyoung ip_hlen = sizeof(ip6);
3671 1.14.2.4 riz /* XXX-BZ this will go badly in case of ext hdrs. */
3672 1.1 dyoung ipproto = ip6.ip6_nxt;
3673 1.1 dyoung type_tucmd_mlhl |= IXGBE_ADVTXD_TUCMD_IPV6;
3674 1.1 dyoung break;
3675 1.1 dyoung default:
3676 1.1 dyoung break;
3677 1.1 dyoung }
3678 1.1 dyoung
3679 1.1 dyoung if ((mp->m_pkthdr.csum_flags & M_CSUM_IPv4) != 0)
3680 1.14.2.5 riz *olinfo_status |= IXGBE_TXD_POPTS_IXSM << 8;
3681 1.1 dyoung
3682 1.1 dyoung vlan_macip_lens |= ip_hlen;
3683 1.1 dyoung type_tucmd_mlhl |= IXGBE_ADVTXD_DCMD_DEXT | IXGBE_ADVTXD_DTYP_CTXT;
3684 1.1 dyoung
3685 1.1 dyoung if (mp->m_pkthdr.csum_flags & (M_CSUM_TCPv4|M_CSUM_TCPv6)) {
3686 1.1 dyoung type_tucmd_mlhl |= IXGBE_ADVTXD_TUCMD_L4T_TCP;
3687 1.14.2.5 riz *olinfo_status |= IXGBE_TXD_POPTS_TXSM << 8;
3688 1.1 dyoung KASSERT(ipproto == IPPROTO_TCP);
3689 1.1 dyoung } else if (mp->m_pkthdr.csum_flags & (M_CSUM_UDPv4|M_CSUM_UDPv6)) {
3690 1.1 dyoung type_tucmd_mlhl |= IXGBE_ADVTXD_TUCMD_L4T_UDP;
3691 1.14.2.5 riz *olinfo_status |= IXGBE_TXD_POPTS_TXSM << 8;
3692 1.1 dyoung KASSERT(ipproto == IPPROTO_UDP);
3693 1.1 dyoung }
3694 1.1 dyoung
3695 1.1 dyoung /* Now copy bits into descriptor */
3696 1.14.2.5 riz TXD->vlan_macip_lens = htole32(vlan_macip_lens);
3697 1.14.2.5 riz TXD->type_tucmd_mlhl = htole32(type_tucmd_mlhl);
3698 1.1 dyoung TXD->seqnum_seed = htole32(0);
3699 1.1 dyoung TXD->mss_l4len_idx = htole32(0);
3700 1.1 dyoung
3701 1.1 dyoung /* We've consumed the first desc, adjust counters */
3702 1.14.2.5 riz if (++ctxd == txr->num_desc)
3703 1.1 dyoung ctxd = 0;
3704 1.1 dyoung txr->next_avail_desc = ctxd;
3705 1.1 dyoung --txr->tx_avail;
3706 1.1 dyoung
3707 1.14.2.5 riz return 0;
3708 1.1 dyoung }
3709 1.1 dyoung
3710 1.1 dyoung /**********************************************************************
3711 1.1 dyoung *
3712 1.1 dyoung * Setup work for hardware segmentation offload (TSO) on
3713 1.1 dyoung * adapters using advanced tx descriptors
3714 1.1 dyoung *
3715 1.1 dyoung **********************************************************************/
3716 1.14.2.5 riz static int
3717 1.14.2.5 riz ixgbe_tso_setup(struct tx_ring *txr, struct mbuf *mp,
3718 1.14.2.5 riz u32 *cmd_type_len, u32 *olinfo_status)
3719 1.1 dyoung {
3720 1.1 dyoung struct m_tag *mtag;
3721 1.1 dyoung struct adapter *adapter = txr->adapter;
3722 1.1 dyoung struct ethercom *ec = &adapter->osdep.ec;
3723 1.1 dyoung struct ixgbe_adv_tx_context_desc *TXD;
3724 1.1 dyoung u32 vlan_macip_lens = 0, type_tucmd_mlhl = 0;
3725 1.14.2.5 riz u32 mss_l4len_idx = 0, paylen;
3726 1.14.2.4 riz u16 vtag = 0, eh_type;
3727 1.14.2.4 riz int ctxd, ehdrlen, ip_hlen, tcp_hlen;
3728 1.1 dyoung struct ether_vlan_header *eh;
3729 1.14.2.4 riz #ifdef INET6
3730 1.14.2.4 riz struct ip6_hdr *ip6;
3731 1.14.2.4 riz #endif
3732 1.14.2.4 riz #ifdef INET
3733 1.1 dyoung struct ip *ip;
3734 1.14.2.4 riz #endif
3735 1.1 dyoung struct tcphdr *th;
3736 1.1 dyoung
3737 1.1 dyoung
3738 1.1 dyoung /*
3739 1.1 dyoung * Determine where frame payload starts.
3740 1.1 dyoung * Jump over vlan headers if already present
3741 1.1 dyoung */
3742 1.1 dyoung eh = mtod(mp, struct ether_vlan_header *);
3743 1.14.2.4 riz if (eh->evl_encap_proto == htons(ETHERTYPE_VLAN)) {
3744 1.1 dyoung ehdrlen = ETHER_HDR_LEN + ETHER_VLAN_ENCAP_LEN;
3745 1.14.2.4 riz eh_type = eh->evl_proto;
3746 1.14.2.4 riz } else {
3747 1.1 dyoung ehdrlen = ETHER_HDR_LEN;
3748 1.14.2.4 riz eh_type = eh->evl_encap_proto;
3749 1.14.2.4 riz }
3750 1.1 dyoung
3751 1.14.2.4 riz switch (ntohs(eh_type)) {
3752 1.14.2.4 riz #ifdef INET6
3753 1.14.2.4 riz case ETHERTYPE_IPV6:
3754 1.14.2.4 riz ip6 = (struct ip6_hdr *)(mp->m_data + ehdrlen);
3755 1.14.2.4 riz /* XXX-BZ For now we do not pretend to support ext. hdrs. */
3756 1.14.2.4 riz if (ip6->ip6_nxt != IPPROTO_TCP)
3757 1.14.2.5 riz return (ENXIO);
3758 1.14.2.4 riz ip_hlen = sizeof(struct ip6_hdr);
3759 1.14.2.5 riz ip6 = (struct ip6_hdr *)(mp->m_data + ehdrlen);
3760 1.14.2.4 riz th = (struct tcphdr *)((char *)ip6 + ip_hlen);
3761 1.14.2.4 riz th->th_sum = in6_cksum_phdr(&ip6->ip6_src,
3762 1.14.2.4 riz &ip6->ip6_dst, 0, htonl(IPPROTO_TCP));
3763 1.14.2.4 riz type_tucmd_mlhl |= IXGBE_ADVTXD_TUCMD_IPV6;
3764 1.14.2.4 riz break;
3765 1.14.2.4 riz #endif
3766 1.14.2.4 riz #ifdef INET
3767 1.14.2.4 riz case ETHERTYPE_IP:
3768 1.14.2.4 riz ip = (struct ip *)(mp->m_data + ehdrlen);
3769 1.14.2.4 riz if (ip->ip_p != IPPROTO_TCP)
3770 1.14.2.5 riz return (ENXIO);
3771 1.14.2.4 riz ip->ip_sum = 0;
3772 1.14.2.4 riz ip_hlen = ip->ip_hl << 2;
3773 1.14.2.4 riz th = (struct tcphdr *)((char *)ip + ip_hlen);
3774 1.14.2.4 riz th->th_sum = in_cksum_phdr(ip->ip_src.s_addr,
3775 1.14.2.4 riz ip->ip_dst.s_addr, htons(IPPROTO_TCP));
3776 1.14.2.4 riz type_tucmd_mlhl |= IXGBE_ADVTXD_TUCMD_IPV4;
3777 1.14.2.4 riz /* Tell transmit desc to also do IPv4 checksum. */
3778 1.14.2.4 riz *olinfo_status |= IXGBE_TXD_POPTS_IXSM << 8;
3779 1.14.2.4 riz break;
3780 1.14.2.4 riz #endif
3781 1.14.2.4 riz default:
3782 1.14.2.4 riz panic("%s: CSUM_TSO but no supported IP version (0x%04x)",
3783 1.14.2.4 riz __func__, ntohs(eh_type));
3784 1.14.2.4 riz break;
3785 1.14.2.4 riz }
3786 1.1 dyoung
3787 1.1 dyoung ctxd = txr->next_avail_desc;
3788 1.1 dyoung TXD = (struct ixgbe_adv_tx_context_desc *) &txr->tx_base[ctxd];
3789 1.1 dyoung
3790 1.1 dyoung tcp_hlen = th->th_off << 2;
3791 1.1 dyoung
3792 1.1 dyoung /* This is used in the transmit desc in encap */
3793 1.14.2.5 riz paylen = mp->m_pkthdr.len - ehdrlen - ip_hlen - tcp_hlen;
3794 1.1 dyoung
3795 1.1 dyoung /* VLAN MACLEN IPLEN */
3796 1.1 dyoung if ((mtag = VLAN_OUTPUT_TAG(ec, mp)) != NULL) {
3797 1.1 dyoung vtag = htole16(VLAN_TAG_VALUE(mtag) & 0xffff);
3798 1.1 dyoung vlan_macip_lens |= (vtag << IXGBE_ADVTXD_VLAN_SHIFT);
3799 1.1 dyoung }
3800 1.1 dyoung
3801 1.1 dyoung vlan_macip_lens |= ehdrlen << IXGBE_ADVTXD_MACLEN_SHIFT;
3802 1.1 dyoung vlan_macip_lens |= ip_hlen;
3803 1.14.2.5 riz TXD->vlan_macip_lens = htole32(vlan_macip_lens);
3804 1.1 dyoung
3805 1.1 dyoung /* ADV DTYPE TUCMD */
3806 1.1 dyoung type_tucmd_mlhl |= IXGBE_ADVTXD_DCMD_DEXT | IXGBE_ADVTXD_DTYP_CTXT;
3807 1.1 dyoung type_tucmd_mlhl |= IXGBE_ADVTXD_TUCMD_L4T_TCP;
3808 1.14.2.5 riz TXD->type_tucmd_mlhl = htole32(type_tucmd_mlhl);
3809 1.1 dyoung
3810 1.1 dyoung /* MSS L4LEN IDX */
3811 1.1 dyoung mss_l4len_idx |= (mp->m_pkthdr.segsz << IXGBE_ADVTXD_MSS_SHIFT);
3812 1.1 dyoung mss_l4len_idx |= (tcp_hlen << IXGBE_ADVTXD_L4LEN_SHIFT);
3813 1.1 dyoung TXD->mss_l4len_idx = htole32(mss_l4len_idx);
3814 1.1 dyoung
3815 1.1 dyoung TXD->seqnum_seed = htole32(0);
3816 1.1 dyoung
3817 1.14.2.5 riz if (++ctxd == txr->num_desc)
3818 1.1 dyoung ctxd = 0;
3819 1.1 dyoung
3820 1.1 dyoung txr->tx_avail--;
3821 1.1 dyoung txr->next_avail_desc = ctxd;
3822 1.14.2.5 riz *cmd_type_len |= IXGBE_ADVTXD_DCMD_TSE;
3823 1.14.2.5 riz *olinfo_status |= IXGBE_TXD_POPTS_TXSM << 8;
3824 1.14.2.5 riz *olinfo_status |= paylen << IXGBE_ADVTXD_PAYLEN_SHIFT;
3825 1.14.2.5 riz ++txr->tso_tx.ev_count;
3826 1.14.2.5 riz return (0);
3827 1.1 dyoung }
3828 1.1 dyoung
3829 1.1 dyoung #ifdef IXGBE_FDIR
3830 1.1 dyoung /*
3831 1.1 dyoung ** This routine parses packet headers so that Flow
3832 1.1 dyoung ** Director can make a hashed filter table entry
3833 1.1 dyoung ** allowing traffic flows to be identified and kept
3834 1.1 dyoung ** on the same cpu. This would be a performance
3835 1.1 dyoung ** hit, but we only do it at IXGBE_FDIR_RATE of
3836 1.1 dyoung ** packets.
3837 1.1 dyoung */
3838 1.1 dyoung static void
3839 1.1 dyoung ixgbe_atr(struct tx_ring *txr, struct mbuf *mp)
3840 1.1 dyoung {
3841 1.1 dyoung struct adapter *adapter = txr->adapter;
3842 1.1 dyoung struct ix_queue *que;
3843 1.1 dyoung struct ip *ip;
3844 1.1 dyoung struct tcphdr *th;
3845 1.1 dyoung struct udphdr *uh;
3846 1.1 dyoung struct ether_vlan_header *eh;
3847 1.1 dyoung union ixgbe_atr_hash_dword input = {.dword = 0};
3848 1.1 dyoung union ixgbe_atr_hash_dword common = {.dword = 0};
3849 1.1 dyoung int ehdrlen, ip_hlen;
3850 1.1 dyoung u16 etype;
3851 1.1 dyoung
3852 1.1 dyoung eh = mtod(mp, struct ether_vlan_header *);
3853 1.1 dyoung if (eh->evl_encap_proto == htons(ETHERTYPE_VLAN)) {
3854 1.1 dyoung ehdrlen = ETHER_HDR_LEN + ETHER_VLAN_ENCAP_LEN;
3855 1.1 dyoung etype = eh->evl_proto;
3856 1.1 dyoung } else {
3857 1.1 dyoung ehdrlen = ETHER_HDR_LEN;
3858 1.1 dyoung etype = eh->evl_encap_proto;
3859 1.1 dyoung }
3860 1.1 dyoung
3861 1.1 dyoung /* Only handling IPv4 */
3862 1.1 dyoung if (etype != htons(ETHERTYPE_IP))
3863 1.1 dyoung return;
3864 1.1 dyoung
3865 1.1 dyoung ip = (struct ip *)(mp->m_data + ehdrlen);
3866 1.1 dyoung ip_hlen = ip->ip_hl << 2;
3867 1.1 dyoung
3868 1.1 dyoung /* check if we're UDP or TCP */
3869 1.1 dyoung switch (ip->ip_p) {
3870 1.1 dyoung case IPPROTO_TCP:
3871 1.1 dyoung th = (struct tcphdr *)((char *)ip + ip_hlen);
3872 1.1 dyoung /* src and dst are inverted */
3873 1.1 dyoung common.port.dst ^= th->th_sport;
3874 1.1 dyoung common.port.src ^= th->th_dport;
3875 1.1 dyoung input.formatted.flow_type ^= IXGBE_ATR_FLOW_TYPE_TCPV4;
3876 1.1 dyoung break;
3877 1.1 dyoung case IPPROTO_UDP:
3878 1.1 dyoung uh = (struct udphdr *)((char *)ip + ip_hlen);
3879 1.1 dyoung /* src and dst are inverted */
3880 1.1 dyoung common.port.dst ^= uh->uh_sport;
3881 1.1 dyoung common.port.src ^= uh->uh_dport;
3882 1.1 dyoung input.formatted.flow_type ^= IXGBE_ATR_FLOW_TYPE_UDPV4;
3883 1.1 dyoung break;
3884 1.1 dyoung default:
3885 1.1 dyoung return;
3886 1.1 dyoung }
3887 1.1 dyoung
3888 1.1 dyoung input.formatted.vlan_id = htobe16(mp->m_pkthdr.ether_vtag);
3889 1.1 dyoung if (mp->m_pkthdr.ether_vtag)
3890 1.1 dyoung common.flex_bytes ^= htons(ETHERTYPE_VLAN);
3891 1.1 dyoung else
3892 1.1 dyoung common.flex_bytes ^= etype;
3893 1.1 dyoung common.ip ^= ip->ip_src.s_addr ^ ip->ip_dst.s_addr;
3894 1.1 dyoung
3895 1.1 dyoung que = &adapter->queues[txr->me];
3896 1.1 dyoung /*
3897 1.1 dyoung ** This assumes the Rx queue and Tx
3898 1.1 dyoung ** queue are bound to the same CPU
3899 1.1 dyoung */
3900 1.1 dyoung ixgbe_fdir_add_signature_filter_82599(&adapter->hw,
3901 1.1 dyoung input, common, que->msix);
3902 1.1 dyoung }
3903 1.1 dyoung #endif /* IXGBE_FDIR */
3904 1.1 dyoung
3905 1.1 dyoung /**********************************************************************
3906 1.1 dyoung *
3907 1.1 dyoung * Examine each tx_buffer in the used queue. If the hardware is done
3908 1.1 dyoung * processing the packet then free associated resources. The
3909 1.1 dyoung * tx_buffer is put back on the free queue.
3910 1.1 dyoung *
3911 1.1 dyoung **********************************************************************/
3912 1.14.2.6 snj static void
3913 1.1 dyoung ixgbe_txeof(struct tx_ring *txr)
3914 1.1 dyoung {
3915 1.14.2.5 riz struct adapter *adapter = txr->adapter;
3916 1.14.2.5 riz struct ifnet *ifp = adapter->ifp;
3917 1.14.2.5 riz u32 work, processed = 0;
3918 1.14.2.5 riz u16 limit = txr->process_limit;
3919 1.14.2.5 riz struct ixgbe_tx_buf *buf;
3920 1.14.2.5 riz union ixgbe_adv_tx_desc *txd;
3921 1.1 dyoung struct timeval now, elapsed;
3922 1.1 dyoung
3923 1.1 dyoung KASSERT(mutex_owned(&txr->tx_mtx));
3924 1.1 dyoung
3925 1.14.2.3 martin #ifdef DEV_NETMAP
3926 1.14.2.3 martin if (ifp->if_capenable & IFCAP_NETMAP) {
3927 1.14.2.3 martin struct netmap_adapter *na = NA(ifp);
3928 1.14.2.3 martin struct netmap_kring *kring = &na->tx_rings[txr->me];
3929 1.14.2.5 riz txd = txr->tx_base;
3930 1.14.2.3 martin bus_dmamap_sync(txr->txdma.dma_tag, txr->txdma.dma_map,
3931 1.14.2.3 martin BUS_DMASYNC_POSTREAD);
3932 1.14.2.3 martin /*
3933 1.14.2.3 martin * In netmap mode, all the work is done in the context
3934 1.14.2.3 martin * of the client thread. Interrupt handlers only wake up
3935 1.14.2.3 martin * clients, which may be sleeping on individual rings
3936 1.14.2.3 martin * or on a global resource for all rings.
3937 1.14.2.3 martin * To implement tx interrupt mitigation, we wake up the client
3938 1.14.2.3 martin * thread roughly every half ring, even if the NIC interrupts
3939 1.14.2.3 martin * more frequently. This is implemented as follows:
3940 1.14.2.3 martin * - ixgbe_txsync() sets kring->nr_kflags with the index of
3941 1.14.2.3 martin * the slot that should wake up the thread (nkr_num_slots
3942 1.14.2.3 martin * means the user thread should not be woken up);
3943 1.14.2.3 martin * - the driver ignores tx interrupts unless netmap_mitigate=0
3944 1.14.2.3 martin * or the slot has the DD bit set.
3945 1.14.2.3 martin */
3946 1.14.2.3 martin if (!netmap_mitigate ||
3947 1.14.2.3 martin (kring->nr_kflags < kring->nkr_num_slots &&
3948 1.14.2.5 riz txd[kring->nr_kflags].wb.status & IXGBE_TXD_STAT_DD)) {
3949 1.14.2.6 snj netmap_tx_irq(ifp, txr->me);
3950 1.14.2.3 martin }
3951 1.14.2.6 snj return;
3952 1.14.2.3 martin }
3953 1.14.2.3 martin #endif /* DEV_NETMAP */
3954 1.14.2.3 martin
3955 1.14.2.5 riz if (txr->tx_avail == txr->num_desc) {
3956 1.1 dyoung txr->queue_status = IXGBE_QUEUE_IDLE;
3957 1.14.2.6 snj return;
3958 1.1 dyoung }
3959 1.1 dyoung
3960 1.14.2.5 riz /* Get work starting point */
3961 1.14.2.5 riz work = txr->next_to_clean;
3962 1.14.2.5 riz buf = &txr->tx_buffers[work];
3963 1.14.2.5 riz txd = &txr->tx_base[work];
3964 1.14.2.5 riz work -= txr->num_desc; /* The distance to ring end */
3965 1.1 dyoung ixgbe_dmamap_sync(txr->txdma.dma_tag, txr->txdma.dma_map,
3966 1.1 dyoung BUS_DMASYNC_POSTREAD);
3967 1.14.2.5 riz do {
3968 1.14.2.5 riz union ixgbe_adv_tx_desc *eop= buf->eop;
3969 1.14.2.5 riz if (eop == NULL) /* No work */
3970 1.14.2.5 riz break;
3971 1.1 dyoung
3972 1.14.2.5 riz if ((eop->wb.status & IXGBE_TXD_STAT_DD) == 0)
3973 1.14.2.5 riz break; /* I/O not complete */
3974 1.14.2.5 riz
3975 1.14.2.5 riz if (buf->m_head) {
3976 1.14.2.5 riz txr->bytes +=
3977 1.14.2.5 riz buf->m_head->m_pkthdr.len;
3978 1.14.2.5 riz bus_dmamap_sync(txr->txtag->dt_dmat,
3979 1.14.2.5 riz buf->map,
3980 1.14.2.5 riz 0, buf->m_head->m_pkthdr.len,
3981 1.14.2.5 riz BUS_DMASYNC_POSTWRITE);
3982 1.14.2.5 riz ixgbe_dmamap_unload(txr->txtag,
3983 1.14.2.5 riz buf->map);
3984 1.14.2.5 riz m_freem(buf->m_head);
3985 1.14.2.5 riz buf->m_head = NULL;
3986 1.14.2.5 riz /*
3987 1.14.2.5 riz * NetBSD: Don't override buf->map with NULL here.
3988 1.14.2.5 riz * It'll panic when a ring runs one lap around.
3989 1.14.2.5 riz */
3990 1.14.2.5 riz }
3991 1.14.2.5 riz buf->eop = NULL;
3992 1.14.2.5 riz ++txr->tx_avail;
3993 1.14.2.5 riz
3994 1.14.2.5 riz /* We clean the range if multi segment */
3995 1.14.2.5 riz while (txd != eop) {
3996 1.14.2.5 riz ++txd;
3997 1.14.2.5 riz ++buf;
3998 1.14.2.5 riz ++work;
3999 1.14.2.5 riz /* wrap the ring? */
4000 1.14.2.5 riz if (__predict_false(!work)) {
4001 1.14.2.5 riz work -= txr->num_desc;
4002 1.14.2.5 riz buf = txr->tx_buffers;
4003 1.14.2.5 riz txd = txr->tx_base;
4004 1.14.2.5 riz }
4005 1.14.2.5 riz if (buf->m_head) {
4006 1.1 dyoung txr->bytes +=
4007 1.14.2.5 riz buf->m_head->m_pkthdr.len;
4008 1.1 dyoung bus_dmamap_sync(txr->txtag->dt_dmat,
4009 1.14.2.5 riz buf->map,
4010 1.14.2.5 riz 0, buf->m_head->m_pkthdr.len,
4011 1.1 dyoung BUS_DMASYNC_POSTWRITE);
4012 1.14.2.5 riz ixgbe_dmamap_unload(txr->txtag,
4013 1.14.2.5 riz buf->map);
4014 1.14.2.5 riz m_freem(buf->m_head);
4015 1.14.2.5 riz buf->m_head = NULL;
4016 1.14.2.5 riz /*
4017 1.14.2.5 riz * NetBSD: Don't override buf->map with NULL
4018 1.14.2.5 riz * here. It'll panic when a ring runs one lap
4019 1.14.2.5 riz * around.
4020 1.14.2.5 riz */
4021 1.1 dyoung }
4022 1.14.2.5 riz ++txr->tx_avail;
4023 1.14.2.5 riz buf->eop = NULL;
4024 1.1 dyoung
4025 1.1 dyoung }
4026 1.1 dyoung ++txr->packets;
4027 1.14.2.5 riz ++processed;
4028 1.1 dyoung ++ifp->if_opackets;
4029 1.14.2.5 riz getmicrotime(&txr->watchdog_time);
4030 1.14.2.5 riz
4031 1.14.2.5 riz /* Try the next packet */
4032 1.14.2.5 riz ++txd;
4033 1.14.2.5 riz ++buf;
4034 1.14.2.5 riz ++work;
4035 1.14.2.5 riz /* reset with a wrap */
4036 1.14.2.5 riz if (__predict_false(!work)) {
4037 1.14.2.5 riz work -= txr->num_desc;
4038 1.14.2.5 riz buf = txr->tx_buffers;
4039 1.14.2.5 riz txd = txr->tx_base;
4040 1.14.2.5 riz }
4041 1.14.2.5 riz prefetch(txd);
4042 1.14.2.5 riz } while (__predict_true(--limit));
4043 1.14.2.5 riz
4044 1.1 dyoung ixgbe_dmamap_sync(txr->txdma.dma_tag, txr->txdma.dma_map,
4045 1.1 dyoung BUS_DMASYNC_PREREAD | BUS_DMASYNC_PREWRITE);
4046 1.1 dyoung
4047 1.14.2.5 riz work += txr->num_desc;
4048 1.14.2.5 riz txr->next_to_clean = work;
4049 1.1 dyoung
4050 1.1 dyoung /*
4051 1.1 dyoung ** Watchdog calculation, we know there's
4052 1.1 dyoung ** work outstanding or the first return
4053 1.1 dyoung ** would have been taken, so none processed
4054 1.1 dyoung ** for too long indicates a hang.
4055 1.1 dyoung */
4056 1.1 dyoung getmicrotime(&now);
4057 1.1 dyoung timersub(&now, &txr->watchdog_time, &elapsed);
4058 1.1 dyoung if (!processed && tvtohz(&elapsed) > IXGBE_WATCHDOG)
4059 1.1 dyoung txr->queue_status = IXGBE_QUEUE_HUNG;
4060 1.1 dyoung
4061 1.14.2.6 snj if (txr->tx_avail == txr->num_desc)
4062 1.14.2.4 riz txr->queue_status = IXGBE_QUEUE_IDLE;
4063 1.1 dyoung
4064 1.14.2.6 snj return;
4065 1.1 dyoung }
4066 1.1 dyoung
4067 1.1 dyoung /*********************************************************************
4068 1.1 dyoung *
4069 1.1 dyoung * Refresh mbuf buffers for RX descriptor rings
4070 1.1 dyoung * - now keeps its own state so discards due to resource
4071 1.1 dyoung * exhaustion are unnecessary, if an mbuf cannot be obtained
4072 1.1 dyoung * it just returns, keeping its placeholder, thus it can simply
4073 1.1 dyoung * be recalled to try again.
4074 1.1 dyoung *
4075 1.1 dyoung **********************************************************************/
4076 1.1 dyoung static void
4077 1.1 dyoung ixgbe_refresh_mbufs(struct rx_ring *rxr, int limit)
4078 1.1 dyoung {
4079 1.1 dyoung struct adapter *adapter = rxr->adapter;
4080 1.1 dyoung struct ixgbe_rx_buf *rxbuf;
4081 1.14.2.4 riz struct mbuf *mp;
4082 1.1 dyoung int i, j, error;
4083 1.1 dyoung bool refreshed = false;
4084 1.1 dyoung
4085 1.1 dyoung i = j = rxr->next_to_refresh;
4086 1.1 dyoung /* Control the loop with one beyond */
4087 1.14.2.5 riz if (++j == rxr->num_desc)
4088 1.1 dyoung j = 0;
4089 1.1 dyoung
4090 1.1 dyoung while (j != limit) {
4091 1.1 dyoung rxbuf = &rxr->rx_buffers[i];
4092 1.14.2.4 riz if (rxbuf->buf == NULL) {
4093 1.14.2.5 riz mp = ixgbe_getjcl(&adapter->jcl_head, M_NOWAIT,
4094 1.14.2.5 riz MT_DATA, M_PKTHDR, rxr->mbuf_sz);
4095 1.1 dyoung if (mp == NULL) {
4096 1.1 dyoung rxr->no_jmbuf.ev_count++;
4097 1.1 dyoung goto update;
4098 1.1 dyoung }
4099 1.14.2.5 riz if (adapter->max_frame_size <= (MCLBYTES - ETHER_ALIGN))
4100 1.14.2.5 riz m_adj(mp, ETHER_ALIGN);
4101 1.1 dyoung } else
4102 1.14.2.4 riz mp = rxbuf->buf;
4103 1.1 dyoung
4104 1.14.2.5 riz mp->m_pkthdr.len = mp->m_len = rxr->mbuf_sz;
4105 1.14.2.6 snj
4106 1.14.2.4 riz /* If we're dealing with an mbuf that was copied rather
4107 1.14.2.4 riz * than replaced, there's no need to go through busdma.
4108 1.14.2.4 riz */
4109 1.14.2.4 riz if ((rxbuf->flags & IXGBE_RX_COPY) == 0) {
4110 1.14.2.4 riz /* Get the memory mapping */
4111 1.14.2.5 riz error = bus_dmamap_load_mbuf(rxr->ptag->dt_dmat,
4112 1.14.2.5 riz rxbuf->pmap, mp, BUS_DMA_NOWAIT);
4113 1.14.2.4 riz if (error != 0) {
4114 1.14.2.4 riz printf("Refresh mbufs: payload dmamap load"
4115 1.14.2.4 riz " failure - %d\n", error);
4116 1.14.2.4 riz m_free(mp);
4117 1.14.2.4 riz rxbuf->buf = NULL;
4118 1.14.2.4 riz goto update;
4119 1.14.2.4 riz }
4120 1.14.2.4 riz rxbuf->buf = mp;
4121 1.14.2.5 riz bus_dmamap_sync(rxr->ptag->dt_dmat, rxbuf->pmap,
4122 1.14.2.4 riz 0, mp->m_pkthdr.len, BUS_DMASYNC_PREREAD);
4123 1.14.2.4 riz rxbuf->addr = rxr->rx_base[i].read.pkt_addr =
4124 1.14.2.5 riz htole64(rxbuf->pmap->dm_segs[0].ds_addr);
4125 1.14.2.4 riz } else {
4126 1.14.2.4 riz rxr->rx_base[i].read.pkt_addr = rxbuf->addr;
4127 1.14.2.4 riz rxbuf->flags &= ~IXGBE_RX_COPY;
4128 1.14.2.4 riz }
4129 1.1 dyoung
4130 1.1 dyoung refreshed = true;
4131 1.1 dyoung /* Next is precalculated */
4132 1.1 dyoung i = j;
4133 1.1 dyoung rxr->next_to_refresh = i;
4134 1.14.2.5 riz if (++j == rxr->num_desc)
4135 1.1 dyoung j = 0;
4136 1.1 dyoung }
4137 1.1 dyoung update:
4138 1.1 dyoung if (refreshed) /* Update hardware tail index */
4139 1.1 dyoung IXGBE_WRITE_REG(&adapter->hw,
4140 1.1 dyoung IXGBE_RDT(rxr->me), rxr->next_to_refresh);
4141 1.1 dyoung return;
4142 1.1 dyoung }
4143 1.1 dyoung
4144 1.1 dyoung /*********************************************************************
4145 1.1 dyoung *
4146 1.1 dyoung * Allocate memory for rx_buffer structures. Since we use one
4147 1.1 dyoung * rx_buffer per received packet, the maximum number of rx_buffer's
4148 1.1 dyoung * that we'll need is equal to the number of receive descriptors
4149 1.1 dyoung * that we've allocated.
4150 1.1 dyoung *
4151 1.1 dyoung **********************************************************************/
4152 1.1 dyoung static int
4153 1.1 dyoung ixgbe_allocate_receive_buffers(struct rx_ring *rxr)
4154 1.1 dyoung {
4155 1.1 dyoung struct adapter *adapter = rxr->adapter;
4156 1.1 dyoung device_t dev = adapter->dev;
4157 1.1 dyoung struct ixgbe_rx_buf *rxbuf;
4158 1.1 dyoung int i, bsize, error;
4159 1.1 dyoung
4160 1.14.2.5 riz bsize = sizeof(struct ixgbe_rx_buf) * rxr->num_desc;
4161 1.1 dyoung if (!(rxr->rx_buffers =
4162 1.1 dyoung (struct ixgbe_rx_buf *) malloc(bsize,
4163 1.1 dyoung M_DEVBUF, M_NOWAIT | M_ZERO))) {
4164 1.1 dyoung aprint_error_dev(dev, "Unable to allocate rx_buffer memory\n");
4165 1.1 dyoung error = ENOMEM;
4166 1.1 dyoung goto fail;
4167 1.1 dyoung }
4168 1.1 dyoung
4169 1.1 dyoung if ((error = ixgbe_dma_tag_create(adapter->osdep.dmat, /* parent */
4170 1.1 dyoung 1, 0, /* alignment, bounds */
4171 1.1 dyoung MJUM16BYTES, /* maxsize */
4172 1.1 dyoung 1, /* nsegments */
4173 1.1 dyoung MJUM16BYTES, /* maxsegsize */
4174 1.1 dyoung 0, /* flags */
4175 1.14.2.5 riz &rxr->ptag))) {
4176 1.1 dyoung aprint_error_dev(dev, "Unable to create RX DMA tag\n");
4177 1.1 dyoung goto fail;
4178 1.1 dyoung }
4179 1.1 dyoung
4180 1.14.2.5 riz for (i = 0; i < rxr->num_desc; i++, rxbuf++) {
4181 1.1 dyoung rxbuf = &rxr->rx_buffers[i];
4182 1.14.2.5 riz error = ixgbe_dmamap_create(rxr->ptag,
4183 1.14.2.5 riz BUS_DMA_NOWAIT, &rxbuf->pmap);
4184 1.1 dyoung if (error) {
4185 1.14.2.4 riz aprint_error_dev(dev, "Unable to create RX dma map\n");
4186 1.1 dyoung goto fail;
4187 1.1 dyoung }
4188 1.1 dyoung }
4189 1.1 dyoung
4190 1.1 dyoung return (0);
4191 1.1 dyoung
4192 1.1 dyoung fail:
4193 1.1 dyoung /* Frees all, but can handle partial completion */
4194 1.1 dyoung ixgbe_free_receive_structures(adapter);
4195 1.1 dyoung return (error);
4196 1.1 dyoung }
4197 1.1 dyoung
4198 1.1 dyoung /*
4199 1.1 dyoung ** Used to detect a descriptor that has
4200 1.1 dyoung ** been merged by Hardware RSC.
4201 1.1 dyoung */
4202 1.1 dyoung static inline u32
4203 1.1 dyoung ixgbe_rsc_count(union ixgbe_adv_rx_desc *rx)
4204 1.1 dyoung {
4205 1.1 dyoung return (le32toh(rx->wb.lower.lo_dword.data) &
4206 1.1 dyoung IXGBE_RXDADV_RSCCNT_MASK) >> IXGBE_RXDADV_RSCCNT_SHIFT;
4207 1.1 dyoung }
4208 1.1 dyoung
4209 1.1 dyoung /*********************************************************************
4210 1.1 dyoung *
4211 1.1 dyoung * Initialize Hardware RSC (LRO) feature on 82599
4212 1.1 dyoung * for an RX ring, this is toggled by the LRO capability
4213 1.1 dyoung * even though it is transparent to the stack.
4214 1.1 dyoung *
4215 1.14.2.4 riz * NOTE: since this HW feature only works with IPV4 and
4216 1.14.2.4 riz * our testing has shown soft LRO to be as effective
4217 1.14.2.4 riz * I have decided to disable this by default.
4218 1.14.2.4 riz *
4219 1.1 dyoung **********************************************************************/
4220 1.1 dyoung static void
4221 1.1 dyoung ixgbe_setup_hw_rsc(struct rx_ring *rxr)
4222 1.1 dyoung {
4223 1.1 dyoung struct adapter *adapter = rxr->adapter;
4224 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
4225 1.1 dyoung u32 rscctrl, rdrxctl;
4226 1.1 dyoung
4227 1.14.2.4 riz /* If turning LRO/RSC off we need to disable it */
4228 1.14.2.4 riz if ((adapter->ifp->if_capenable & IFCAP_LRO) == 0) {
4229 1.14.2.4 riz rscctrl = IXGBE_READ_REG(hw, IXGBE_RSCCTL(rxr->me));
4230 1.14.2.4 riz rscctrl &= ~IXGBE_RSCCTL_RSCEN;
4231 1.14.2.4 riz return;
4232 1.14.2.4 riz }
4233 1.14.2.4 riz
4234 1.1 dyoung rdrxctl = IXGBE_READ_REG(hw, IXGBE_RDRXCTL);
4235 1.1 dyoung rdrxctl &= ~IXGBE_RDRXCTL_RSCFRSTSIZE;
4236 1.14.2.4 riz #ifdef DEV_NETMAP /* crcstrip is optional in netmap */
4237 1.14.2.4 riz if (adapter->ifp->if_capenable & IFCAP_NETMAP && !ix_crcstrip)
4238 1.14.2.4 riz #endif /* DEV_NETMAP */
4239 1.1 dyoung rdrxctl |= IXGBE_RDRXCTL_CRCSTRIP;
4240 1.1 dyoung rdrxctl |= IXGBE_RDRXCTL_RSCACKC;
4241 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_RDRXCTL, rdrxctl);
4242 1.1 dyoung
4243 1.1 dyoung rscctrl = IXGBE_READ_REG(hw, IXGBE_RSCCTL(rxr->me));
4244 1.1 dyoung rscctrl |= IXGBE_RSCCTL_RSCEN;
4245 1.1 dyoung /*
4246 1.1 dyoung ** Limit the total number of descriptors that
4247 1.1 dyoung ** can be combined, so it does not exceed 64K
4248 1.1 dyoung */
4249 1.14.2.5 riz if (rxr->mbuf_sz == MCLBYTES)
4250 1.1 dyoung rscctrl |= IXGBE_RSCCTL_MAXDESC_16;
4251 1.14.2.5 riz else if (rxr->mbuf_sz == MJUMPAGESIZE)
4252 1.1 dyoung rscctrl |= IXGBE_RSCCTL_MAXDESC_8;
4253 1.14.2.5 riz else if (rxr->mbuf_sz == MJUM9BYTES)
4254 1.1 dyoung rscctrl |= IXGBE_RSCCTL_MAXDESC_4;
4255 1.1 dyoung else /* Using 16K cluster */
4256 1.1 dyoung rscctrl |= IXGBE_RSCCTL_MAXDESC_1;
4257 1.1 dyoung
4258 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_RSCCTL(rxr->me), rscctrl);
4259 1.1 dyoung
4260 1.1 dyoung /* Enable TCP header recognition */
4261 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_PSRTYPE(0),
4262 1.1 dyoung (IXGBE_READ_REG(hw, IXGBE_PSRTYPE(0)) |
4263 1.1 dyoung IXGBE_PSRTYPE_TCPHDR));
4264 1.1 dyoung
4265 1.1 dyoung /* Disable RSC for ACK packets */
4266 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_RSCDBU,
4267 1.1 dyoung (IXGBE_RSCDBU_RSCACKDIS | IXGBE_READ_REG(hw, IXGBE_RSCDBU)));
4268 1.1 dyoung
4269 1.1 dyoung rxr->hw_rsc = TRUE;
4270 1.1 dyoung }
4271 1.1 dyoung
4272 1.1 dyoung
4273 1.1 dyoung static void
4274 1.1 dyoung ixgbe_free_receive_ring(struct rx_ring *rxr)
4275 1.1 dyoung {
4276 1.1 dyoung struct ixgbe_rx_buf *rxbuf;
4277 1.1 dyoung int i;
4278 1.1 dyoung
4279 1.14.2.5 riz for (i = 0; i < rxr->num_desc; i++) {
4280 1.1 dyoung rxbuf = &rxr->rx_buffers[i];
4281 1.14.2.4 riz if (rxbuf->buf != NULL) {
4282 1.14.2.5 riz bus_dmamap_sync(rxr->ptag->dt_dmat, rxbuf->pmap,
4283 1.14.2.4 riz 0, rxbuf->buf->m_pkthdr.len,
4284 1.1 dyoung BUS_DMASYNC_POSTREAD);
4285 1.14.2.5 riz ixgbe_dmamap_unload(rxr->ptag, rxbuf->pmap);
4286 1.14.2.4 riz rxbuf->buf->m_flags |= M_PKTHDR;
4287 1.14.2.4 riz m_freem(rxbuf->buf);
4288 1.14.2.4 riz rxbuf->buf = NULL;
4289 1.14.2.6 snj rxbuf->flags = 0;
4290 1.1 dyoung }
4291 1.1 dyoung }
4292 1.1 dyoung }
4293 1.1 dyoung
4294 1.1 dyoung
4295 1.1 dyoung /*********************************************************************
4296 1.1 dyoung *
4297 1.1 dyoung * Initialize a receive ring and its buffers.
4298 1.1 dyoung *
4299 1.1 dyoung **********************************************************************/
4300 1.1 dyoung static int
4301 1.1 dyoung ixgbe_setup_receive_ring(struct rx_ring *rxr)
4302 1.1 dyoung {
4303 1.1 dyoung struct adapter *adapter;
4304 1.1 dyoung struct ixgbe_rx_buf *rxbuf;
4305 1.1 dyoung #ifdef LRO
4306 1.14.2.4 riz struct ifnet *ifp;
4307 1.1 dyoung struct lro_ctrl *lro = &rxr->lro;
4308 1.1 dyoung #endif /* LRO */
4309 1.1 dyoung int rsize, error = 0;
4310 1.14.2.3 martin #ifdef DEV_NETMAP
4311 1.14.2.3 martin struct netmap_adapter *na = NA(rxr->adapter->ifp);
4312 1.14.2.3 martin struct netmap_slot *slot;
4313 1.14.2.3 martin #endif /* DEV_NETMAP */
4314 1.1 dyoung
4315 1.1 dyoung adapter = rxr->adapter;
4316 1.14.2.4 riz #ifdef LRO
4317 1.1 dyoung ifp = adapter->ifp;
4318 1.14.2.4 riz #endif /* LRO */
4319 1.1 dyoung
4320 1.1 dyoung /* Clear the ring contents */
4321 1.1 dyoung IXGBE_RX_LOCK(rxr);
4322 1.14.2.3 martin #ifdef DEV_NETMAP
4323 1.14.2.3 martin /* same as in ixgbe_setup_transmit_ring() */
4324 1.14.2.3 martin slot = netmap_reset(na, NR_RX, rxr->me, 0);
4325 1.14.2.3 martin #endif /* DEV_NETMAP */
4326 1.1 dyoung rsize = roundup2(adapter->num_rx_desc *
4327 1.1 dyoung sizeof(union ixgbe_adv_rx_desc), DBA_ALIGN);
4328 1.1 dyoung bzero((void *)rxr->rx_base, rsize);
4329 1.14.2.5 riz /* Cache the size */
4330 1.14.2.5 riz rxr->mbuf_sz = adapter->rx_mbuf_sz;
4331 1.1 dyoung
4332 1.1 dyoung /* Free current RX buffer structs and their mbufs */
4333 1.1 dyoung ixgbe_free_receive_ring(rxr);
4334 1.1 dyoung
4335 1.14.2.2 martin IXGBE_RX_UNLOCK(rxr);
4336 1.14.2.2 martin
4337 1.1 dyoung /* Now reinitialize our supply of jumbo mbufs. The number
4338 1.1 dyoung * or size of jumbo mbufs may have changed.
4339 1.1 dyoung */
4340 1.14.2.5 riz ixgbe_jcl_reinit(&adapter->jcl_head, rxr->ptag->dt_dmat,
4341 1.1 dyoung 2 * adapter->num_rx_desc, adapter->rx_mbuf_sz);
4342 1.1 dyoung
4343 1.14.2.2 martin IXGBE_RX_LOCK(rxr);
4344 1.14.2.2 martin
4345 1.1 dyoung /* Now replenish the mbufs */
4346 1.14.2.5 riz for (int j = 0; j != rxr->num_desc; ++j) {
4347 1.14.2.4 riz struct mbuf *mp;
4348 1.1 dyoung
4349 1.1 dyoung rxbuf = &rxr->rx_buffers[j];
4350 1.14.2.3 martin #ifdef DEV_NETMAP
4351 1.14.2.3 martin /*
4352 1.14.2.3 martin * In netmap mode, fill the map and set the buffer
4353 1.14.2.3 martin * address in the NIC ring, considering the offset
4354 1.14.2.3 martin * between the netmap and NIC rings (see comment in
4355 1.14.2.3 martin * ixgbe_setup_transmit_ring() ). No need to allocate
4356 1.14.2.3 martin * an mbuf, so end the block with a continue;
4357 1.14.2.3 martin */
4358 1.14.2.3 martin if (slot) {
4359 1.14.2.4 riz int sj = netmap_idx_n2k(&na->rx_rings[rxr->me], j);
4360 1.14.2.3 martin uint64_t paddr;
4361 1.14.2.3 martin void *addr;
4362 1.14.2.3 martin
4363 1.14.2.6 snj addr = PNMB(na, slot + sj, &paddr);
4364 1.14.2.6 snj netmap_load_map(na, rxr->ptag, rxbuf->pmap, addr);
4365 1.14.2.6 snj /* Update descriptor and the cached value */
4366 1.14.2.3 martin rxr->rx_base[j].read.pkt_addr = htole64(paddr);
4367 1.14.2.6 snj rxbuf->addr = htole64(paddr);
4368 1.14.2.3 martin continue;
4369 1.14.2.3 martin }
4370 1.14.2.3 martin #endif /* DEV_NETMAP */
4371 1.14.2.6 snj rxbuf->flags = 0;
4372 1.14.2.5 riz rxbuf->buf = ixgbe_getjcl(&adapter->jcl_head, M_NOWAIT,
4373 1.1 dyoung MT_DATA, M_PKTHDR, adapter->rx_mbuf_sz);
4374 1.14.2.4 riz if (rxbuf->buf == NULL) {
4375 1.1 dyoung error = ENOBUFS;
4376 1.1 dyoung goto fail;
4377 1.1 dyoung }
4378 1.14.2.4 riz mp = rxbuf->buf;
4379 1.14.2.5 riz mp->m_pkthdr.len = mp->m_len = rxr->mbuf_sz;
4380 1.1 dyoung /* Get the memory mapping */
4381 1.14.2.5 riz error = bus_dmamap_load_mbuf(rxr->ptag->dt_dmat,
4382 1.14.2.5 riz rxbuf->pmap, mp, BUS_DMA_NOWAIT);
4383 1.1 dyoung if (error != 0)
4384 1.1 dyoung goto fail;
4385 1.14.2.5 riz bus_dmamap_sync(rxr->ptag->dt_dmat, rxbuf->pmap,
4386 1.1 dyoung 0, adapter->rx_mbuf_sz, BUS_DMASYNC_PREREAD);
4387 1.14.2.6 snj /* Update the descriptor and the cached value */
4388 1.1 dyoung rxr->rx_base[j].read.pkt_addr =
4389 1.14.2.5 riz htole64(rxbuf->pmap->dm_segs[0].ds_addr);
4390 1.14.2.6 snj rxbuf->addr = htole64(rxbuf->pmap->dm_segs[0].ds_addr);
4391 1.1 dyoung }
4392 1.1 dyoung
4393 1.1 dyoung
4394 1.1 dyoung /* Setup our descriptor indices */
4395 1.1 dyoung rxr->next_to_check = 0;
4396 1.1 dyoung rxr->next_to_refresh = 0;
4397 1.1 dyoung rxr->lro_enabled = FALSE;
4398 1.14.2.4 riz rxr->rx_copies.ev_count = 0;
4399 1.1 dyoung rxr->rx_bytes.ev_count = 0;
4400 1.14.2.4 riz rxr->vtag_strip = FALSE;
4401 1.1 dyoung
4402 1.1 dyoung ixgbe_dmamap_sync(rxr->rxdma.dma_tag, rxr->rxdma.dma_map,
4403 1.1 dyoung BUS_DMASYNC_PREREAD | BUS_DMASYNC_PREWRITE);
4404 1.1 dyoung
4405 1.1 dyoung /*
4406 1.1 dyoung ** Now set up the LRO interface:
4407 1.1 dyoung */
4408 1.14.2.4 riz if (ixgbe_rsc_enable)
4409 1.1 dyoung ixgbe_setup_hw_rsc(rxr);
4410 1.1 dyoung #ifdef LRO
4411 1.1 dyoung else if (ifp->if_capenable & IFCAP_LRO) {
4412 1.9 skrll device_t dev = adapter->dev;
4413 1.1 dyoung int err = tcp_lro_init(lro);
4414 1.1 dyoung if (err) {
4415 1.1 dyoung device_printf(dev, "LRO Initialization failed!\n");
4416 1.1 dyoung goto fail;
4417 1.1 dyoung }
4418 1.1 dyoung INIT_DEBUGOUT("RX Soft LRO Initialized\n");
4419 1.1 dyoung rxr->lro_enabled = TRUE;
4420 1.1 dyoung lro->ifp = adapter->ifp;
4421 1.1 dyoung }
4422 1.1 dyoung #endif /* LRO */
4423 1.1 dyoung
4424 1.1 dyoung IXGBE_RX_UNLOCK(rxr);
4425 1.1 dyoung return (0);
4426 1.1 dyoung
4427 1.1 dyoung fail:
4428 1.1 dyoung ixgbe_free_receive_ring(rxr);
4429 1.1 dyoung IXGBE_RX_UNLOCK(rxr);
4430 1.1 dyoung return (error);
4431 1.1 dyoung }
4432 1.1 dyoung
4433 1.1 dyoung /*********************************************************************
4434 1.1 dyoung *
4435 1.1 dyoung * Initialize all receive rings.
4436 1.1 dyoung *
4437 1.1 dyoung **********************************************************************/
4438 1.1 dyoung static int
4439 1.1 dyoung ixgbe_setup_receive_structures(struct adapter *adapter)
4440 1.1 dyoung {
4441 1.1 dyoung struct rx_ring *rxr = adapter->rx_rings;
4442 1.1 dyoung int j;
4443 1.1 dyoung
4444 1.1 dyoung for (j = 0; j < adapter->num_queues; j++, rxr++)
4445 1.1 dyoung if (ixgbe_setup_receive_ring(rxr))
4446 1.1 dyoung goto fail;
4447 1.1 dyoung
4448 1.1 dyoung return (0);
4449 1.1 dyoung fail:
4450 1.1 dyoung /*
4451 1.1 dyoung * Free RX buffers allocated so far, we will only handle
4452 1.1 dyoung * the rings that completed, the failing case will have
4453 1.1 dyoung * cleaned up for itself. 'j' failed, so its the terminus.
4454 1.1 dyoung */
4455 1.1 dyoung for (int i = 0; i < j; ++i) {
4456 1.1 dyoung rxr = &adapter->rx_rings[i];
4457 1.1 dyoung ixgbe_free_receive_ring(rxr);
4458 1.1 dyoung }
4459 1.1 dyoung
4460 1.1 dyoung return (ENOBUFS);
4461 1.1 dyoung }
4462 1.1 dyoung
4463 1.14.2.6 snj static void
4464 1.14.2.6 snj ixgbe_initialise_rss_mapping(struct adapter *adapter)
4465 1.14.2.6 snj {
4466 1.14.2.6 snj struct ixgbe_hw *hw = &adapter->hw;
4467 1.14.2.6 snj uint32_t reta;
4468 1.14.2.6 snj int i, j, queue_id;
4469 1.14.2.6 snj uint32_t rss_key[10];
4470 1.14.2.6 snj uint32_t mrqc;
4471 1.14.2.6 snj #ifdef RSS
4472 1.14.2.6 snj uint32_t rss_hash_config;
4473 1.14.2.6 snj #endif
4474 1.14.2.6 snj
4475 1.14.2.6 snj /* Setup RSS */
4476 1.14.2.6 snj reta = 0;
4477 1.14.2.6 snj
4478 1.14.2.6 snj #ifdef RSS
4479 1.14.2.6 snj /* Fetch the configured RSS key */
4480 1.14.2.6 snj rss_getkey((uint8_t *) &rss_key);
4481 1.14.2.6 snj #else
4482 1.14.2.6 snj /* set up random bits */
4483 1.14.2.6 snj cprng_fast(&rss_key, sizeof(rss_key));
4484 1.14.2.6 snj #endif
4485 1.14.2.6 snj
4486 1.14.2.6 snj /* Set up the redirection table */
4487 1.14.2.6 snj for (i = 0, j = 0; i < 128; i++, j++) {
4488 1.14.2.6 snj if (j == adapter->num_queues) j = 0;
4489 1.14.2.6 snj #ifdef RSS
4490 1.14.2.6 snj /*
4491 1.14.2.6 snj * Fetch the RSS bucket id for the given indirection entry.
4492 1.14.2.6 snj * Cap it at the number of configured buckets (which is
4493 1.14.2.6 snj * num_queues.)
4494 1.14.2.6 snj */
4495 1.14.2.6 snj queue_id = rss_get_indirection_to_bucket(i);
4496 1.14.2.6 snj queue_id = queue_id % adapter->num_queues;
4497 1.14.2.6 snj #else
4498 1.14.2.6 snj queue_id = (j * 0x11);
4499 1.14.2.6 snj #endif
4500 1.14.2.6 snj /*
4501 1.14.2.6 snj * The low 8 bits are for hash value (n+0);
4502 1.14.2.6 snj * The next 8 bits are for hash value (n+1), etc.
4503 1.14.2.6 snj */
4504 1.14.2.6 snj reta = reta >> 8;
4505 1.14.2.6 snj reta = reta | ( ((uint32_t) queue_id) << 24);
4506 1.14.2.6 snj if ((i & 3) == 3) {
4507 1.14.2.6 snj IXGBE_WRITE_REG(hw, IXGBE_RETA(i >> 2), reta);
4508 1.14.2.6 snj reta = 0;
4509 1.14.2.6 snj }
4510 1.14.2.6 snj }
4511 1.14.2.6 snj
4512 1.14.2.6 snj /* Now fill our hash function seeds */
4513 1.14.2.6 snj for (i = 0; i < 10; i++)
4514 1.14.2.6 snj IXGBE_WRITE_REG(hw, IXGBE_RSSRK(i), rss_key[i]);
4515 1.14.2.6 snj
4516 1.14.2.6 snj /* Perform hash on these packet types */
4517 1.14.2.6 snj #ifdef RSS
4518 1.14.2.6 snj mrqc = IXGBE_MRQC_RSSEN;
4519 1.14.2.6 snj rss_hash_config = rss_gethashconfig();
4520 1.14.2.6 snj if (rss_hash_config & RSS_HASHTYPE_RSS_IPV4)
4521 1.14.2.6 snj mrqc |= IXGBE_MRQC_RSS_FIELD_IPV4;
4522 1.14.2.6 snj if (rss_hash_config & RSS_HASHTYPE_RSS_TCP_IPV4)
4523 1.14.2.6 snj mrqc |= IXGBE_MRQC_RSS_FIELD_IPV4_TCP;
4524 1.14.2.6 snj if (rss_hash_config & RSS_HASHTYPE_RSS_IPV6)
4525 1.14.2.6 snj mrqc |= IXGBE_MRQC_RSS_FIELD_IPV6;
4526 1.14.2.6 snj if (rss_hash_config & RSS_HASHTYPE_RSS_TCP_IPV6)
4527 1.14.2.6 snj mrqc |= IXGBE_MRQC_RSS_FIELD_IPV6_TCP;
4528 1.14.2.6 snj if (rss_hash_config & RSS_HASHTYPE_RSS_IPV6_EX)
4529 1.14.2.6 snj mrqc |= IXGBE_MRQC_RSS_FIELD_IPV6_EX;
4530 1.14.2.6 snj if (rss_hash_config & RSS_HASHTYPE_RSS_TCP_IPV6_EX)
4531 1.14.2.6 snj mrqc |= IXGBE_MRQC_RSS_FIELD_IPV6_EX_TCP;
4532 1.14.2.6 snj if (rss_hash_config & RSS_HASHTYPE_RSS_UDP_IPV4)
4533 1.14.2.6 snj mrqc |= IXGBE_MRQC_RSS_FIELD_IPV4_UDP;
4534 1.14.2.6 snj if (rss_hash_config & RSS_HASHTYPE_RSS_UDP_IPV4_EX)
4535 1.14.2.6 snj device_printf(adapter->dev,
4536 1.14.2.6 snj "%s: RSS_HASHTYPE_RSS_UDP_IPV4_EX defined, "
4537 1.14.2.6 snj "but not supported\n", __func__);
4538 1.14.2.6 snj if (rss_hash_config & RSS_HASHTYPE_RSS_UDP_IPV6)
4539 1.14.2.6 snj mrqc |= IXGBE_MRQC_RSS_FIELD_IPV6_UDP;
4540 1.14.2.6 snj if (rss_hash_config & RSS_HASHTYPE_RSS_UDP_IPV6_EX)
4541 1.14.2.6 snj mrqc |= IXGBE_MRQC_RSS_FIELD_IPV6_EX_UDP;
4542 1.14.2.6 snj #else
4543 1.14.2.6 snj /*
4544 1.14.2.6 snj * Disable UDP - IP fragments aren't currently being handled
4545 1.14.2.6 snj * and so we end up with a mix of 2-tuple and 4-tuple
4546 1.14.2.6 snj * traffic.
4547 1.14.2.6 snj */
4548 1.14.2.6 snj mrqc = IXGBE_MRQC_RSSEN
4549 1.14.2.6 snj | IXGBE_MRQC_RSS_FIELD_IPV4
4550 1.14.2.6 snj | IXGBE_MRQC_RSS_FIELD_IPV4_TCP
4551 1.14.2.6 snj #if 0
4552 1.14.2.6 snj | IXGBE_MRQC_RSS_FIELD_IPV4_UDP
4553 1.14.2.6 snj #endif
4554 1.14.2.6 snj | IXGBE_MRQC_RSS_FIELD_IPV6_EX_TCP
4555 1.14.2.6 snj | IXGBE_MRQC_RSS_FIELD_IPV6_EX
4556 1.14.2.6 snj | IXGBE_MRQC_RSS_FIELD_IPV6
4557 1.14.2.6 snj | IXGBE_MRQC_RSS_FIELD_IPV6_TCP
4558 1.14.2.6 snj #if 0
4559 1.14.2.6 snj | IXGBE_MRQC_RSS_FIELD_IPV6_UDP
4560 1.14.2.6 snj | IXGBE_MRQC_RSS_FIELD_IPV6_EX_UDP
4561 1.14.2.6 snj #endif
4562 1.14.2.6 snj ;
4563 1.14.2.6 snj #endif /* RSS */
4564 1.14.2.6 snj IXGBE_WRITE_REG(hw, IXGBE_MRQC, mrqc);
4565 1.14.2.6 snj }
4566 1.14.2.6 snj
4567 1.14.2.6 snj
4568 1.1 dyoung /*********************************************************************
4569 1.1 dyoung *
4570 1.1 dyoung * Setup receive registers and features.
4571 1.1 dyoung *
4572 1.1 dyoung **********************************************************************/
4573 1.1 dyoung #define IXGBE_SRRCTL_BSIZEHDRSIZE_SHIFT 2
4574 1.1 dyoung
4575 1.14.2.3 martin #define BSIZEPKT_ROUNDUP ((1<<IXGBE_SRRCTL_BSIZEPKT_SHIFT)-1)
4576 1.14.2.3 martin
4577 1.1 dyoung static void
4578 1.1 dyoung ixgbe_initialize_receive_units(struct adapter *adapter)
4579 1.1 dyoung {
4580 1.1 dyoung int i;
4581 1.1 dyoung struct rx_ring *rxr = adapter->rx_rings;
4582 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
4583 1.1 dyoung struct ifnet *ifp = adapter->ifp;
4584 1.1 dyoung u32 bufsz, rxctrl, fctrl, srrctl, rxcsum;
4585 1.14.2.6 snj u32 hlreg;
4586 1.1 dyoung
4587 1.1 dyoung
4588 1.1 dyoung /*
4589 1.1 dyoung * Make sure receives are disabled while
4590 1.1 dyoung * setting up the descriptor ring
4591 1.1 dyoung */
4592 1.1 dyoung rxctrl = IXGBE_READ_REG(hw, IXGBE_RXCTRL);
4593 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_RXCTRL,
4594 1.1 dyoung rxctrl & ~IXGBE_RXCTRL_RXEN);
4595 1.1 dyoung
4596 1.1 dyoung /* Enable broadcasts */
4597 1.1 dyoung fctrl = IXGBE_READ_REG(hw, IXGBE_FCTRL);
4598 1.1 dyoung fctrl |= IXGBE_FCTRL_BAM;
4599 1.1 dyoung fctrl |= IXGBE_FCTRL_DPF;
4600 1.1 dyoung fctrl |= IXGBE_FCTRL_PMCF;
4601 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_FCTRL, fctrl);
4602 1.1 dyoung
4603 1.1 dyoung /* Set for Jumbo Frames? */
4604 1.1 dyoung hlreg = IXGBE_READ_REG(hw, IXGBE_HLREG0);
4605 1.1 dyoung if (ifp->if_mtu > ETHERMTU)
4606 1.1 dyoung hlreg |= IXGBE_HLREG0_JUMBOEN;
4607 1.1 dyoung else
4608 1.1 dyoung hlreg &= ~IXGBE_HLREG0_JUMBOEN;
4609 1.14.2.4 riz #ifdef DEV_NETMAP
4610 1.14.2.4 riz /* crcstrip is conditional in netmap (in RDRXCTL too ?) */
4611 1.14.2.4 riz if (ifp->if_capenable & IFCAP_NETMAP && !ix_crcstrip)
4612 1.14.2.4 riz hlreg &= ~IXGBE_HLREG0_RXCRCSTRP;
4613 1.14.2.4 riz else
4614 1.14.2.4 riz hlreg |= IXGBE_HLREG0_RXCRCSTRP;
4615 1.14.2.4 riz #endif /* DEV_NETMAP */
4616 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_HLREG0, hlreg);
4617 1.1 dyoung
4618 1.14.2.4 riz bufsz = (adapter->rx_mbuf_sz +
4619 1.14.2.4 riz BSIZEPKT_ROUNDUP) >> IXGBE_SRRCTL_BSIZEPKT_SHIFT;
4620 1.1 dyoung
4621 1.1 dyoung for (i = 0; i < adapter->num_queues; i++, rxr++) {
4622 1.1 dyoung u64 rdba = rxr->rxdma.dma_paddr;
4623 1.1 dyoung
4624 1.1 dyoung /* Setup the Base and Length of the Rx Descriptor Ring */
4625 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_RDBAL(i),
4626 1.1 dyoung (rdba & 0x00000000ffffffffULL));
4627 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_RDBAH(i), (rdba >> 32));
4628 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_RDLEN(i),
4629 1.1 dyoung adapter->num_rx_desc * sizeof(union ixgbe_adv_rx_desc));
4630 1.1 dyoung
4631 1.1 dyoung /* Set up the SRRCTL register */
4632 1.1 dyoung srrctl = IXGBE_READ_REG(hw, IXGBE_SRRCTL(i));
4633 1.1 dyoung srrctl &= ~IXGBE_SRRCTL_BSIZEHDR_MASK;
4634 1.1 dyoung srrctl &= ~IXGBE_SRRCTL_BSIZEPKT_MASK;
4635 1.1 dyoung srrctl |= bufsz;
4636 1.14.2.4 riz srrctl |= IXGBE_SRRCTL_DESCTYPE_ADV_ONEBUF;
4637 1.14.2.6 snj
4638 1.14.2.6 snj /*
4639 1.14.2.6 snj * Set DROP_EN iff we have no flow control and >1 queue.
4640 1.14.2.6 snj * Note that srrctl was cleared shortly before during reset,
4641 1.14.2.6 snj * so we do not need to clear the bit, but do it just in case
4642 1.14.2.6 snj * this code is moved elsewhere.
4643 1.14.2.6 snj */
4644 1.14.2.6 snj if (adapter->num_queues > 1 &&
4645 1.14.2.6 snj adapter->fc == ixgbe_fc_none) {
4646 1.14.2.6 snj srrctl |= IXGBE_SRRCTL_DROP_EN;
4647 1.14.2.6 snj } else {
4648 1.14.2.6 snj srrctl &= ~IXGBE_SRRCTL_DROP_EN;
4649 1.14.2.6 snj }
4650 1.14.2.6 snj
4651 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_SRRCTL(i), srrctl);
4652 1.1 dyoung
4653 1.1 dyoung /* Setup the HW Rx Head and Tail Descriptor Pointers */
4654 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_RDH(i), 0);
4655 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_RDT(i), 0);
4656 1.14.2.5 riz
4657 1.14.2.5 riz /* Set the processing limit */
4658 1.14.2.5 riz rxr->process_limit = ixgbe_rx_process_limit;
4659 1.1 dyoung }
4660 1.1 dyoung
4661 1.1 dyoung if (adapter->hw.mac.type != ixgbe_mac_82598EB) {
4662 1.1 dyoung u32 psrtype = IXGBE_PSRTYPE_TCPHDR |
4663 1.1 dyoung IXGBE_PSRTYPE_UDPHDR |
4664 1.1 dyoung IXGBE_PSRTYPE_IPV4HDR |
4665 1.1 dyoung IXGBE_PSRTYPE_IPV6HDR;
4666 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_PSRTYPE(0), psrtype);
4667 1.1 dyoung }
4668 1.1 dyoung
4669 1.1 dyoung rxcsum = IXGBE_READ_REG(hw, IXGBE_RXCSUM);
4670 1.1 dyoung
4671 1.14.2.6 snj ixgbe_initialise_rss_mapping(adapter);
4672 1.1 dyoung
4673 1.14.2.6 snj if (adapter->num_queues > 1) {
4674 1.1 dyoung /* RSS and RX IPP Checksum are mutually exclusive */
4675 1.1 dyoung rxcsum |= IXGBE_RXCSUM_PCSD;
4676 1.1 dyoung }
4677 1.1 dyoung
4678 1.1 dyoung if (ifp->if_capenable & IFCAP_RXCSUM)
4679 1.1 dyoung rxcsum |= IXGBE_RXCSUM_PCSD;
4680 1.1 dyoung
4681 1.1 dyoung if (!(rxcsum & IXGBE_RXCSUM_PCSD))
4682 1.1 dyoung rxcsum |= IXGBE_RXCSUM_IPPCSE;
4683 1.1 dyoung
4684 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_RXCSUM, rxcsum);
4685 1.1 dyoung
4686 1.1 dyoung return;
4687 1.1 dyoung }
4688 1.1 dyoung
4689 1.1 dyoung /*********************************************************************
4690 1.1 dyoung *
4691 1.1 dyoung * Free all receive rings.
4692 1.1 dyoung *
4693 1.1 dyoung **********************************************************************/
4694 1.1 dyoung static void
4695 1.1 dyoung ixgbe_free_receive_structures(struct adapter *adapter)
4696 1.1 dyoung {
4697 1.1 dyoung struct rx_ring *rxr = adapter->rx_rings;
4698 1.1 dyoung
4699 1.14.2.6 snj INIT_DEBUGOUT("ixgbe_free_receive_structures: begin");
4700 1.14.2.6 snj
4701 1.1 dyoung for (int i = 0; i < adapter->num_queues; i++, rxr++) {
4702 1.1 dyoung #ifdef LRO
4703 1.1 dyoung struct lro_ctrl *lro = &rxr->lro;
4704 1.1 dyoung #endif /* LRO */
4705 1.1 dyoung ixgbe_free_receive_buffers(rxr);
4706 1.1 dyoung #ifdef LRO
4707 1.1 dyoung /* Free LRO memory */
4708 1.1 dyoung tcp_lro_free(lro);
4709 1.1 dyoung #endif /* LRO */
4710 1.1 dyoung /* Free the ring memory as well */
4711 1.1 dyoung ixgbe_dma_free(adapter, &rxr->rxdma);
4712 1.14.2.2 martin IXGBE_RX_LOCK_DESTROY(rxr);
4713 1.1 dyoung }
4714 1.1 dyoung
4715 1.1 dyoung free(adapter->rx_rings, M_DEVBUF);
4716 1.1 dyoung }
4717 1.1 dyoung
4718 1.1 dyoung
4719 1.1 dyoung /*********************************************************************
4720 1.1 dyoung *
4721 1.1 dyoung * Free receive ring data structures
4722 1.1 dyoung *
4723 1.1 dyoung **********************************************************************/
4724 1.1 dyoung static void
4725 1.1 dyoung ixgbe_free_receive_buffers(struct rx_ring *rxr)
4726 1.1 dyoung {
4727 1.1 dyoung struct adapter *adapter = rxr->adapter;
4728 1.1 dyoung struct ixgbe_rx_buf *rxbuf;
4729 1.1 dyoung
4730 1.14.2.6 snj INIT_DEBUGOUT("ixgbe_free_receive_buffers: begin");
4731 1.1 dyoung
4732 1.1 dyoung /* Cleanup any existing buffers */
4733 1.1 dyoung if (rxr->rx_buffers != NULL) {
4734 1.1 dyoung for (int i = 0; i < adapter->num_rx_desc; i++) {
4735 1.1 dyoung rxbuf = &rxr->rx_buffers[i];
4736 1.14.2.4 riz if (rxbuf->buf != NULL) {
4737 1.14.2.5 riz bus_dmamap_sync(rxr->ptag->dt_dmat,
4738 1.14.2.5 riz rxbuf->pmap, 0, rxbuf->buf->m_pkthdr.len,
4739 1.1 dyoung BUS_DMASYNC_POSTREAD);
4740 1.14.2.5 riz ixgbe_dmamap_unload(rxr->ptag, rxbuf->pmap);
4741 1.14.2.4 riz rxbuf->buf->m_flags |= M_PKTHDR;
4742 1.14.2.4 riz m_freem(rxbuf->buf);
4743 1.1 dyoung }
4744 1.14.2.4 riz rxbuf->buf = NULL;
4745 1.14.2.5 riz if (rxbuf->pmap != NULL) {
4746 1.14.2.5 riz ixgbe_dmamap_destroy(rxr->ptag, rxbuf->pmap);
4747 1.14.2.5 riz rxbuf->pmap = NULL;
4748 1.1 dyoung }
4749 1.1 dyoung }
4750 1.1 dyoung if (rxr->rx_buffers != NULL) {
4751 1.1 dyoung free(rxr->rx_buffers, M_DEVBUF);
4752 1.1 dyoung rxr->rx_buffers = NULL;
4753 1.1 dyoung }
4754 1.1 dyoung }
4755 1.1 dyoung
4756 1.14.2.5 riz if (rxr->ptag != NULL) {
4757 1.14.2.5 riz ixgbe_dma_tag_destroy(rxr->ptag);
4758 1.14.2.5 riz rxr->ptag = NULL;
4759 1.1 dyoung }
4760 1.1 dyoung
4761 1.1 dyoung return;
4762 1.1 dyoung }
4763 1.1 dyoung
4764 1.1 dyoung static __inline void
4765 1.1 dyoung ixgbe_rx_input(struct rx_ring *rxr, struct ifnet *ifp, struct mbuf *m, u32 ptype)
4766 1.1 dyoung {
4767 1.1 dyoung int s;
4768 1.1 dyoung
4769 1.9 skrll #ifdef LRO
4770 1.9 skrll struct adapter *adapter = ifp->if_softc;
4771 1.9 skrll struct ethercom *ec = &adapter->osdep.ec;
4772 1.1 dyoung
4773 1.1 dyoung /*
4774 1.14.2.4 riz * ATM LRO is only for IP/TCP packets and TCP checksum of the packet
4775 1.1 dyoung * should be computed by hardware. Also it should not have VLAN tag in
4776 1.14.2.4 riz * ethernet header. In case of IPv6 we do not yet support ext. hdrs.
4777 1.1 dyoung */
4778 1.1 dyoung if (rxr->lro_enabled &&
4779 1.1 dyoung (ec->ec_capenable & ETHERCAP_VLAN_HWTAGGING) != 0 &&
4780 1.1 dyoung (ptype & IXGBE_RXDADV_PKTTYPE_ETQF) == 0 &&
4781 1.14.2.4 riz ((ptype & (IXGBE_RXDADV_PKTTYPE_IPV4 | IXGBE_RXDADV_PKTTYPE_TCP)) ==
4782 1.14.2.4 riz (IXGBE_RXDADV_PKTTYPE_IPV4 | IXGBE_RXDADV_PKTTYPE_TCP) ||
4783 1.14.2.4 riz (ptype & (IXGBE_RXDADV_PKTTYPE_IPV6 | IXGBE_RXDADV_PKTTYPE_TCP)) ==
4784 1.14.2.4 riz (IXGBE_RXDADV_PKTTYPE_IPV6 | IXGBE_RXDADV_PKTTYPE_TCP)) &&
4785 1.1 dyoung (m->m_pkthdr.csum_flags & (CSUM_DATA_VALID | CSUM_PSEUDO_HDR)) ==
4786 1.1 dyoung (CSUM_DATA_VALID | CSUM_PSEUDO_HDR)) {
4787 1.1 dyoung /*
4788 1.1 dyoung * Send to the stack if:
4789 1.1 dyoung ** - LRO not enabled, or
4790 1.1 dyoung ** - no LRO resources, or
4791 1.1 dyoung ** - lro enqueue fails
4792 1.1 dyoung */
4793 1.1 dyoung if (rxr->lro.lro_cnt != 0)
4794 1.1 dyoung if (tcp_lro_rx(&rxr->lro, m, 0) == 0)
4795 1.1 dyoung return;
4796 1.1 dyoung }
4797 1.1 dyoung #endif /* LRO */
4798 1.1 dyoung
4799 1.1 dyoung IXGBE_RX_UNLOCK(rxr);
4800 1.1 dyoung
4801 1.1 dyoung s = splnet();
4802 1.1 dyoung /* Pass this up to any BPF listeners. */
4803 1.1 dyoung bpf_mtap(ifp, m);
4804 1.1 dyoung (*ifp->if_input)(ifp, m);
4805 1.1 dyoung splx(s);
4806 1.1 dyoung
4807 1.1 dyoung IXGBE_RX_LOCK(rxr);
4808 1.1 dyoung }
4809 1.1 dyoung
4810 1.1 dyoung static __inline void
4811 1.1 dyoung ixgbe_rx_discard(struct rx_ring *rxr, int i)
4812 1.1 dyoung {
4813 1.1 dyoung struct ixgbe_rx_buf *rbuf;
4814 1.1 dyoung
4815 1.1 dyoung rbuf = &rxr->rx_buffers[i];
4816 1.1 dyoung
4817 1.1 dyoung
4818 1.1 dyoung /*
4819 1.1 dyoung ** With advanced descriptors the writeback
4820 1.1 dyoung ** clobbers the buffer addrs, so its easier
4821 1.1 dyoung ** to just free the existing mbufs and take
4822 1.1 dyoung ** the normal refresh path to get new buffers
4823 1.1 dyoung ** and mapping.
4824 1.1 dyoung */
4825 1.14.2.6 snj
4826 1.14.2.6 snj if (rbuf->buf != NULL) {/* Partial chain ? */
4827 1.14.2.6 snj rbuf->fmp->m_flags |= M_PKTHDR;
4828 1.14.2.6 snj m_freem(rbuf->fmp);
4829 1.14.2.6 snj rbuf->fmp = NULL;
4830 1.14.2.6 snj rbuf->buf = NULL; /* rbuf->buf is part of fmp's chain */
4831 1.14.2.6 snj } else if (rbuf->buf) {
4832 1.14.2.4 riz m_free(rbuf->buf);
4833 1.14.2.4 riz rbuf->buf = NULL;
4834 1.1 dyoung }
4835 1.14.2.6 snj
4836 1.14.2.6 snj rbuf->flags = 0;
4837 1.14.2.6 snj
4838 1.1 dyoung return;
4839 1.1 dyoung }
4840 1.1 dyoung
4841 1.1 dyoung
4842 1.1 dyoung /*********************************************************************
4843 1.1 dyoung *
4844 1.1 dyoung * This routine executes in interrupt context. It replenishes
4845 1.1 dyoung * the mbufs in the descriptor and sends data which has been
4846 1.1 dyoung * dma'ed into host memory to upper layer.
4847 1.1 dyoung *
4848 1.1 dyoung * We loop at most count times if count is > 0, or until done if
4849 1.1 dyoung * count < 0.
4850 1.1 dyoung *
4851 1.1 dyoung * Return TRUE for more work, FALSE for all clean.
4852 1.1 dyoung *********************************************************************/
4853 1.1 dyoung static bool
4854 1.14.2.5 riz ixgbe_rxeof(struct ix_queue *que)
4855 1.1 dyoung {
4856 1.1 dyoung struct adapter *adapter = que->adapter;
4857 1.1 dyoung struct rx_ring *rxr = que->rxr;
4858 1.1 dyoung struct ifnet *ifp = adapter->ifp;
4859 1.1 dyoung #ifdef LRO
4860 1.1 dyoung struct lro_ctrl *lro = &rxr->lro;
4861 1.1 dyoung struct lro_entry *queued;
4862 1.1 dyoung #endif /* LRO */
4863 1.1 dyoung int i, nextp, processed = 0;
4864 1.1 dyoung u32 staterr = 0;
4865 1.14.2.5 riz u16 count = rxr->process_limit;
4866 1.1 dyoung union ixgbe_adv_rx_desc *cur;
4867 1.1 dyoung struct ixgbe_rx_buf *rbuf, *nbuf;
4868 1.14.2.6 snj #ifdef RSS
4869 1.14.2.6 snj u16 pkt_info;
4870 1.14.2.6 snj #endif
4871 1.1 dyoung
4872 1.1 dyoung IXGBE_RX_LOCK(rxr);
4873 1.1 dyoung
4874 1.14.2.3 martin #ifdef DEV_NETMAP
4875 1.14.2.5 riz /* Same as the txeof routine: wakeup clients on intr. */
4876 1.14.2.6 snj if (netmap_rx_irq(ifp, rxr->me, &processed)) {
4877 1.14.2.6 snj IXGBE_RX_UNLOCK(rxr);
4878 1.14.2.3 martin return (FALSE);
4879 1.14.2.6 snj }
4880 1.14.2.3 martin #endif /* DEV_NETMAP */
4881 1.14.2.6 snj
4882 1.1 dyoung for (i = rxr->next_to_check; count != 0;) {
4883 1.14.2.4 riz struct mbuf *sendmp, *mp;
4884 1.1 dyoung u32 rsc, ptype;
4885 1.14.2.4 riz u16 len;
4886 1.14.2.4 riz u16 vtag = 0;
4887 1.1 dyoung bool eop;
4888 1.1 dyoung
4889 1.1 dyoung /* Sync the ring. */
4890 1.1 dyoung ixgbe_dmamap_sync(rxr->rxdma.dma_tag, rxr->rxdma.dma_map,
4891 1.1 dyoung BUS_DMASYNC_POSTREAD | BUS_DMASYNC_POSTWRITE);
4892 1.1 dyoung
4893 1.1 dyoung cur = &rxr->rx_base[i];
4894 1.1 dyoung staterr = le32toh(cur->wb.upper.status_error);
4895 1.14.2.6 snj #ifdef RSS
4896 1.14.2.6 snj pkt_info = le16toh(cur->wb.lower.lo_dword.hs_rss.pkt_info);
4897 1.14.2.6 snj #endif
4898 1.1 dyoung
4899 1.1 dyoung if ((staterr & IXGBE_RXD_STAT_DD) == 0)
4900 1.1 dyoung break;
4901 1.1 dyoung if ((ifp->if_flags & IFF_RUNNING) == 0)
4902 1.1 dyoung break;
4903 1.1 dyoung
4904 1.1 dyoung count--;
4905 1.1 dyoung sendmp = NULL;
4906 1.1 dyoung nbuf = NULL;
4907 1.1 dyoung rsc = 0;
4908 1.1 dyoung cur->wb.upper.status_error = 0;
4909 1.1 dyoung rbuf = &rxr->rx_buffers[i];
4910 1.14.2.4 riz mp = rbuf->buf;
4911 1.1 dyoung
4912 1.14.2.4 riz len = le16toh(cur->wb.upper.length);
4913 1.1 dyoung ptype = le32toh(cur->wb.lower.lo_dword.data) &
4914 1.1 dyoung IXGBE_RXDADV_PKTTYPE_MASK;
4915 1.1 dyoung eop = ((staterr & IXGBE_RXD_STAT_EOP) != 0);
4916 1.1 dyoung
4917 1.1 dyoung /* Make sure bad packets are discarded */
4918 1.14.2.6 snj if (eop && (staterr & IXGBE_RXDADV_ERR_FRAME_ERR_MASK) != 0) {
4919 1.1 dyoung rxr->rx_discarded.ev_count++;
4920 1.1 dyoung ixgbe_rx_discard(rxr, i);
4921 1.1 dyoung goto next_desc;
4922 1.1 dyoung }
4923 1.1 dyoung
4924 1.1 dyoung /*
4925 1.1 dyoung ** On 82599 which supports a hardware
4926 1.1 dyoung ** LRO (called HW RSC), packets need
4927 1.1 dyoung ** not be fragmented across sequential
4928 1.1 dyoung ** descriptors, rather the next descriptor
4929 1.1 dyoung ** is indicated in bits of the descriptor.
4930 1.1 dyoung ** This also means that we might proceses
4931 1.1 dyoung ** more than one packet at a time, something
4932 1.1 dyoung ** that has never been true before, it
4933 1.1 dyoung ** required eliminating global chain pointers
4934 1.1 dyoung ** in favor of what we are doing here. -jfv
4935 1.1 dyoung */
4936 1.1 dyoung if (!eop) {
4937 1.1 dyoung /*
4938 1.1 dyoung ** Figure out the next descriptor
4939 1.1 dyoung ** of this frame.
4940 1.1 dyoung */
4941 1.1 dyoung if (rxr->hw_rsc == TRUE) {
4942 1.1 dyoung rsc = ixgbe_rsc_count(cur);
4943 1.1 dyoung rxr->rsc_num += (rsc - 1);
4944 1.1 dyoung }
4945 1.1 dyoung if (rsc) { /* Get hardware index */
4946 1.1 dyoung nextp = ((staterr &
4947 1.1 dyoung IXGBE_RXDADV_NEXTP_MASK) >>
4948 1.1 dyoung IXGBE_RXDADV_NEXTP_SHIFT);
4949 1.1 dyoung } else { /* Just sequential */
4950 1.1 dyoung nextp = i + 1;
4951 1.1 dyoung if (nextp == adapter->num_rx_desc)
4952 1.1 dyoung nextp = 0;
4953 1.1 dyoung }
4954 1.1 dyoung nbuf = &rxr->rx_buffers[nextp];
4955 1.1 dyoung prefetch(nbuf);
4956 1.1 dyoung }
4957 1.1 dyoung /*
4958 1.1 dyoung ** Rather than using the fmp/lmp global pointers
4959 1.1 dyoung ** we now keep the head of a packet chain in the
4960 1.1 dyoung ** buffer struct and pass this along from one
4961 1.1 dyoung ** descriptor to the next, until we get EOP.
4962 1.1 dyoung */
4963 1.14.2.4 riz mp->m_len = len;
4964 1.14.2.4 riz /*
4965 1.14.2.4 riz ** See if there is a stored head
4966 1.14.2.4 riz ** that determines what we are
4967 1.14.2.4 riz */
4968 1.14.2.4 riz sendmp = rbuf->fmp;
4969 1.14.2.4 riz if (sendmp != NULL) { /* secondary frag */
4970 1.14.2.4 riz rbuf->buf = rbuf->fmp = NULL;
4971 1.14.2.4 riz mp->m_flags &= ~M_PKTHDR;
4972 1.14.2.4 riz sendmp->m_pkthdr.len += mp->m_len;
4973 1.1 dyoung } else {
4974 1.1 dyoung /*
4975 1.14.2.4 riz * Optimize. This might be a small packet,
4976 1.14.2.4 riz * maybe just a TCP ACK. Do a fast copy that
4977 1.14.2.4 riz * is cache aligned into a new mbuf, and
4978 1.14.2.4 riz * leave the old mbuf+cluster for re-use.
4979 1.14.2.4 riz */
4980 1.14.2.4 riz if (eop && len <= IXGBE_RX_COPY_LEN) {
4981 1.14.2.5 riz sendmp = m_gethdr(M_NOWAIT, MT_DATA);
4982 1.14.2.4 riz if (sendmp != NULL) {
4983 1.14.2.4 riz sendmp->m_data +=
4984 1.14.2.4 riz IXGBE_RX_COPY_ALIGN;
4985 1.14.2.4 riz ixgbe_bcopy(mp->m_data,
4986 1.14.2.4 riz sendmp->m_data, len);
4987 1.14.2.4 riz sendmp->m_len = len;
4988 1.14.2.4 riz rxr->rx_copies.ev_count++;
4989 1.14.2.4 riz rbuf->flags |= IXGBE_RX_COPY;
4990 1.1 dyoung }
4991 1.1 dyoung }
4992 1.14.2.4 riz if (sendmp == NULL) {
4993 1.14.2.4 riz rbuf->buf = rbuf->fmp = NULL;
4994 1.14.2.4 riz sendmp = mp;
4995 1.14.2.4 riz }
4996 1.14.2.4 riz
4997 1.14.2.4 riz /* first desc of a non-ps chain */
4998 1.14.2.4 riz sendmp->m_flags |= M_PKTHDR;
4999 1.14.2.4 riz sendmp->m_pkthdr.len = mp->m_len;
5000 1.1 dyoung }
5001 1.1 dyoung ++processed;
5002 1.14.2.6 snj
5003 1.14.2.4 riz /* Pass the head pointer on */
5004 1.14.2.4 riz if (eop == 0) {
5005 1.14.2.4 riz nbuf->fmp = sendmp;
5006 1.14.2.4 riz sendmp = NULL;
5007 1.14.2.4 riz mp->m_next = nbuf->buf;
5008 1.14.2.4 riz } else { /* Sending this frame */
5009 1.1 dyoung sendmp->m_pkthdr.rcvif = ifp;
5010 1.1 dyoung ifp->if_ipackets++;
5011 1.1 dyoung rxr->rx_packets.ev_count++;
5012 1.1 dyoung /* capture data for AIM */
5013 1.1 dyoung rxr->bytes += sendmp->m_pkthdr.len;
5014 1.1 dyoung rxr->rx_bytes.ev_count += sendmp->m_pkthdr.len;
5015 1.14.2.4 riz /* Process vlan info */
5016 1.14.2.4 riz if ((rxr->vtag_strip) &&
5017 1.14.2.4 riz (staterr & IXGBE_RXD_STAT_VP))
5018 1.14.2.4 riz vtag = le16toh(cur->wb.upper.vlan);
5019 1.14.2.4 riz if (vtag) {
5020 1.14.2.4 riz VLAN_INPUT_TAG(ifp, sendmp, vtag,
5021 1.14.2.4 riz printf("%s: could not apply VLAN "
5022 1.14.2.4 riz "tag", __func__));
5023 1.14.2.4 riz }
5024 1.1 dyoung if ((ifp->if_capenable & IFCAP_RXCSUM) != 0) {
5025 1.1 dyoung ixgbe_rx_checksum(staterr, sendmp, ptype,
5026 1.1 dyoung &adapter->stats);
5027 1.1 dyoung }
5028 1.1 dyoung #if __FreeBSD_version >= 800000
5029 1.14.2.6 snj #ifdef RSS
5030 1.14.2.6 snj sendmp->m_pkthdr.flowid =
5031 1.14.2.6 snj le32toh(cur->wb.lower.hi_dword.rss);
5032 1.14.2.6 snj switch (pkt_info & IXGBE_RXDADV_RSSTYPE_MASK) {
5033 1.14.2.6 snj case IXGBE_RXDADV_RSSTYPE_IPV4_TCP:
5034 1.14.2.6 snj M_HASHTYPE_SET(sendmp, M_HASHTYPE_RSS_TCP_IPV4);
5035 1.14.2.6 snj break;
5036 1.14.2.6 snj case IXGBE_RXDADV_RSSTYPE_IPV4:
5037 1.14.2.6 snj M_HASHTYPE_SET(sendmp, M_HASHTYPE_RSS_IPV4);
5038 1.14.2.6 snj break;
5039 1.14.2.6 snj case IXGBE_RXDADV_RSSTYPE_IPV6_TCP:
5040 1.14.2.6 snj M_HASHTYPE_SET(sendmp, M_HASHTYPE_RSS_TCP_IPV6);
5041 1.14.2.6 snj break;
5042 1.14.2.6 snj case IXGBE_RXDADV_RSSTYPE_IPV6_EX:
5043 1.14.2.6 snj M_HASHTYPE_SET(sendmp, M_HASHTYPE_RSS_IPV6_EX);
5044 1.14.2.6 snj break;
5045 1.14.2.6 snj case IXGBE_RXDADV_RSSTYPE_IPV6:
5046 1.14.2.6 snj M_HASHTYPE_SET(sendmp, M_HASHTYPE_RSS_IPV6);
5047 1.14.2.6 snj break;
5048 1.14.2.6 snj case IXGBE_RXDADV_RSSTYPE_IPV6_TCP_EX:
5049 1.14.2.6 snj M_HASHTYPE_SET(sendmp, M_HASHTYPE_RSS_TCP_IPV6_EX);
5050 1.14.2.6 snj break;
5051 1.14.2.6 snj case IXGBE_RXDADV_RSSTYPE_IPV4_UDP:
5052 1.14.2.6 snj M_HASHTYPE_SET(sendmp, M_HASHTYPE_RSS_UDP_IPV4);
5053 1.14.2.6 snj break;
5054 1.14.2.6 snj case IXGBE_RXDADV_RSSTYPE_IPV6_UDP:
5055 1.14.2.6 snj M_HASHTYPE_SET(sendmp, M_HASHTYPE_RSS_UDP_IPV6);
5056 1.14.2.6 snj break;
5057 1.14.2.6 snj case IXGBE_RXDADV_RSSTYPE_IPV6_UDP_EX:
5058 1.14.2.6 snj M_HASHTYPE_SET(sendmp, M_HASHTYPE_RSS_UDP_IPV6_EX);
5059 1.14.2.6 snj break;
5060 1.14.2.6 snj default:
5061 1.14.2.6 snj /* XXX fallthrough */
5062 1.14.2.6 snj M_HASHTYPE_SET(sendmp, M_HASHTYPE_OPAQUE);
5063 1.14.2.6 snj break;
5064 1.14.2.6 snj }
5065 1.14.2.6 snj #else /* RSS */
5066 1.1 dyoung sendmp->m_pkthdr.flowid = que->msix;
5067 1.14.2.6 snj M_HASHTYPE_SET(sendmp, M_HASHTYPE_OPAQUE);
5068 1.14.2.6 snj #endif /* RSS */
5069 1.14.2.6 snj #endif /* FreeBSD_version */
5070 1.1 dyoung }
5071 1.1 dyoung next_desc:
5072 1.1 dyoung ixgbe_dmamap_sync(rxr->rxdma.dma_tag, rxr->rxdma.dma_map,
5073 1.1 dyoung BUS_DMASYNC_PREREAD | BUS_DMASYNC_PREWRITE);
5074 1.1 dyoung
5075 1.1 dyoung /* Advance our pointers to the next descriptor. */
5076 1.14.2.5 riz if (++i == rxr->num_desc)
5077 1.1 dyoung i = 0;
5078 1.1 dyoung
5079 1.1 dyoung /* Now send to the stack or do LRO */
5080 1.1 dyoung if (sendmp != NULL) {
5081 1.1 dyoung rxr->next_to_check = i;
5082 1.1 dyoung ixgbe_rx_input(rxr, ifp, sendmp, ptype);
5083 1.1 dyoung i = rxr->next_to_check;
5084 1.1 dyoung }
5085 1.1 dyoung
5086 1.1 dyoung /* Every 8 descriptors we go to refresh mbufs */
5087 1.1 dyoung if (processed == 8) {
5088 1.1 dyoung ixgbe_refresh_mbufs(rxr, i);
5089 1.1 dyoung processed = 0;
5090 1.1 dyoung }
5091 1.1 dyoung }
5092 1.1 dyoung
5093 1.1 dyoung /* Refresh any remaining buf structs */
5094 1.1 dyoung if (ixgbe_rx_unrefreshed(rxr))
5095 1.1 dyoung ixgbe_refresh_mbufs(rxr, i);
5096 1.1 dyoung
5097 1.1 dyoung rxr->next_to_check = i;
5098 1.1 dyoung
5099 1.1 dyoung #ifdef LRO
5100 1.1 dyoung /*
5101 1.1 dyoung * Flush any outstanding LRO work
5102 1.1 dyoung */
5103 1.1 dyoung while ((queued = SLIST_FIRST(&lro->lro_active)) != NULL) {
5104 1.1 dyoung SLIST_REMOVE_HEAD(&lro->lro_active, next);
5105 1.1 dyoung tcp_lro_flush(lro, queued);
5106 1.1 dyoung }
5107 1.1 dyoung #endif /* LRO */
5108 1.1 dyoung
5109 1.1 dyoung IXGBE_RX_UNLOCK(rxr);
5110 1.1 dyoung
5111 1.1 dyoung /*
5112 1.14.2.6 snj ** Still have cleaning to do?
5113 1.1 dyoung */
5114 1.14.2.6 snj if ((staterr & IXGBE_RXD_STAT_DD) != 0)
5115 1.1 dyoung return true;
5116 1.14.2.6 snj else
5117 1.14.2.6 snj return false;
5118 1.1 dyoung }
5119 1.1 dyoung
5120 1.1 dyoung
5121 1.1 dyoung /*********************************************************************
5122 1.1 dyoung *
5123 1.1 dyoung * Verify that the hardware indicated that the checksum is valid.
5124 1.1 dyoung * Inform the stack about the status of checksum so that stack
5125 1.1 dyoung * doesn't spend time verifying the checksum.
5126 1.1 dyoung *
5127 1.1 dyoung *********************************************************************/
5128 1.1 dyoung static void
5129 1.1 dyoung ixgbe_rx_checksum(u32 staterr, struct mbuf * mp, u32 ptype,
5130 1.1 dyoung struct ixgbe_hw_stats *stats)
5131 1.1 dyoung {
5132 1.1 dyoung u16 status = (u16) staterr;
5133 1.1 dyoung u8 errors = (u8) (staterr >> 24);
5134 1.9 skrll #if 0
5135 1.1 dyoung bool sctp = FALSE;
5136 1.1 dyoung
5137 1.1 dyoung if ((ptype & IXGBE_RXDADV_PKTTYPE_ETQF) == 0 &&
5138 1.1 dyoung (ptype & IXGBE_RXDADV_PKTTYPE_SCTP) != 0)
5139 1.1 dyoung sctp = TRUE;
5140 1.9 skrll #endif
5141 1.1 dyoung
5142 1.1 dyoung if (status & IXGBE_RXD_STAT_IPCS) {
5143 1.1 dyoung stats->ipcs.ev_count++;
5144 1.1 dyoung if (!(errors & IXGBE_RXD_ERR_IPE)) {
5145 1.1 dyoung /* IP Checksum Good */
5146 1.1 dyoung mp->m_pkthdr.csum_flags = M_CSUM_IPv4;
5147 1.1 dyoung
5148 1.1 dyoung } else {
5149 1.1 dyoung stats->ipcs_bad.ev_count++;
5150 1.1 dyoung mp->m_pkthdr.csum_flags = M_CSUM_IPv4|M_CSUM_IPv4_BAD;
5151 1.1 dyoung }
5152 1.1 dyoung }
5153 1.1 dyoung if (status & IXGBE_RXD_STAT_L4CS) {
5154 1.1 dyoung stats->l4cs.ev_count++;
5155 1.14.2.6 snj int type = M_CSUM_TCPv4|M_CSUM_TCPv6|M_CSUM_UDPv4|M_CSUM_UDPv6;
5156 1.1 dyoung if (!(errors & IXGBE_RXD_ERR_TCPE)) {
5157 1.1 dyoung mp->m_pkthdr.csum_flags |= type;
5158 1.1 dyoung } else {
5159 1.1 dyoung stats->l4cs_bad.ev_count++;
5160 1.1 dyoung mp->m_pkthdr.csum_flags |= type | M_CSUM_TCP_UDP_BAD;
5161 1.1 dyoung }
5162 1.1 dyoung }
5163 1.1 dyoung return;
5164 1.1 dyoung }
5165 1.1 dyoung
5166 1.1 dyoung
5167 1.1 dyoung #if 0 /* XXX Badly need to overhaul vlan(4) on NetBSD. */
5168 1.1 dyoung /*
5169 1.1 dyoung ** This routine is run via an vlan config EVENT,
5170 1.1 dyoung ** it enables us to use the HW Filter table since
5171 1.1 dyoung ** we can get the vlan id. This just creates the
5172 1.1 dyoung ** entry in the soft version of the VFTA, init will
5173 1.1 dyoung ** repopulate the real table.
5174 1.1 dyoung */
5175 1.1 dyoung static void
5176 1.1 dyoung ixgbe_register_vlan(void *arg, struct ifnet *ifp, u16 vtag)
5177 1.1 dyoung {
5178 1.1 dyoung struct adapter *adapter = ifp->if_softc;
5179 1.1 dyoung u16 index, bit;
5180 1.1 dyoung
5181 1.1 dyoung if (ifp->if_softc != arg) /* Not our event */
5182 1.1 dyoung return;
5183 1.1 dyoung
5184 1.1 dyoung if ((vtag == 0) || (vtag > 4095)) /* Invalid */
5185 1.1 dyoung return;
5186 1.1 dyoung
5187 1.1 dyoung IXGBE_CORE_LOCK(adapter);
5188 1.1 dyoung index = (vtag >> 5) & 0x7F;
5189 1.1 dyoung bit = vtag & 0x1F;
5190 1.1 dyoung adapter->shadow_vfta[index] |= (1 << bit);
5191 1.14.2.6 snj ixgbe_setup_vlan_hw_support(adapter);
5192 1.1 dyoung IXGBE_CORE_UNLOCK(adapter);
5193 1.1 dyoung }
5194 1.1 dyoung
5195 1.1 dyoung /*
5196 1.1 dyoung ** This routine is run via an vlan
5197 1.1 dyoung ** unconfig EVENT, remove our entry
5198 1.1 dyoung ** in the soft vfta.
5199 1.1 dyoung */
5200 1.1 dyoung static void
5201 1.1 dyoung ixgbe_unregister_vlan(void *arg, struct ifnet *ifp, u16 vtag)
5202 1.1 dyoung {
5203 1.1 dyoung struct adapter *adapter = ifp->if_softc;
5204 1.1 dyoung u16 index, bit;
5205 1.1 dyoung
5206 1.1 dyoung if (ifp->if_softc != arg)
5207 1.1 dyoung return;
5208 1.1 dyoung
5209 1.1 dyoung if ((vtag == 0) || (vtag > 4095)) /* Invalid */
5210 1.1 dyoung return;
5211 1.1 dyoung
5212 1.1 dyoung IXGBE_CORE_LOCK(adapter);
5213 1.1 dyoung index = (vtag >> 5) & 0x7F;
5214 1.1 dyoung bit = vtag & 0x1F;
5215 1.1 dyoung adapter->shadow_vfta[index] &= ~(1 << bit);
5216 1.1 dyoung /* Re-init to load the changes */
5217 1.14.2.6 snj ixgbe_setup_vlan_hw_support(adapter);
5218 1.1 dyoung IXGBE_CORE_UNLOCK(adapter);
5219 1.1 dyoung }
5220 1.1 dyoung #endif
5221 1.1 dyoung
5222 1.1 dyoung static void
5223 1.1 dyoung ixgbe_setup_vlan_hw_support(struct adapter *adapter)
5224 1.1 dyoung {
5225 1.1 dyoung struct ethercom *ec = &adapter->osdep.ec;
5226 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
5227 1.14.2.4 riz struct rx_ring *rxr;
5228 1.1 dyoung u32 ctrl;
5229 1.1 dyoung
5230 1.14.2.6 snj
5231 1.1 dyoung /*
5232 1.1 dyoung ** We get here thru init_locked, meaning
5233 1.1 dyoung ** a soft reset, this has already cleared
5234 1.1 dyoung ** the VFTA and other state, so if there
5235 1.1 dyoung ** have been no vlan's registered do nothing.
5236 1.1 dyoung */
5237 1.1 dyoung if (!VLAN_ATTACHED(&adapter->osdep.ec)) {
5238 1.1 dyoung return;
5239 1.1 dyoung }
5240 1.1 dyoung
5241 1.14.2.6 snj /* Setup the queues for vlans */
5242 1.14.2.6 snj for (int i = 0; i < adapter->num_queues; i++) {
5243 1.14.2.6 snj rxr = &adapter->rx_rings[i];
5244 1.14.2.6 snj /* On 82599 the VLAN enable is per/queue in RXDCTL */
5245 1.14.2.6 snj if (hw->mac.type != ixgbe_mac_82598EB) {
5246 1.14.2.6 snj ctrl = IXGBE_READ_REG(hw, IXGBE_RXDCTL(i));
5247 1.14.2.6 snj ctrl |= IXGBE_RXDCTL_VME;
5248 1.14.2.6 snj IXGBE_WRITE_REG(hw, IXGBE_RXDCTL(i), ctrl);
5249 1.14.2.6 snj }
5250 1.14.2.6 snj rxr->vtag_strip = TRUE;
5251 1.14.2.6 snj }
5252 1.14.2.6 snj
5253 1.14.2.6 snj if ((ec->ec_capenable & ETHERCAP_VLAN_HWFILTER) == 0)
5254 1.14.2.6 snj return;
5255 1.1 dyoung /*
5256 1.1 dyoung ** A soft reset zero's out the VFTA, so
5257 1.1 dyoung ** we need to repopulate it now.
5258 1.1 dyoung */
5259 1.1 dyoung for (int i = 0; i < IXGBE_VFTA_SIZE; i++)
5260 1.1 dyoung if (adapter->shadow_vfta[i] != 0)
5261 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_VFTA(i),
5262 1.1 dyoung adapter->shadow_vfta[i]);
5263 1.1 dyoung
5264 1.1 dyoung ctrl = IXGBE_READ_REG(hw, IXGBE_VLNCTRL);
5265 1.1 dyoung /* Enable the Filter Table if enabled */
5266 1.1 dyoung if (ec->ec_capenable & ETHERCAP_VLAN_HWFILTER) {
5267 1.1 dyoung ctrl &= ~IXGBE_VLNCTRL_CFIEN;
5268 1.1 dyoung ctrl |= IXGBE_VLNCTRL_VFE;
5269 1.1 dyoung }
5270 1.1 dyoung if (hw->mac.type == ixgbe_mac_82598EB)
5271 1.1 dyoung ctrl |= IXGBE_VLNCTRL_VME;
5272 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_VLNCTRL, ctrl);
5273 1.1 dyoung }
5274 1.1 dyoung
5275 1.1 dyoung static void
5276 1.1 dyoung ixgbe_enable_intr(struct adapter *adapter)
5277 1.1 dyoung {
5278 1.14.2.5 riz struct ixgbe_hw *hw = &adapter->hw;
5279 1.14.2.5 riz struct ix_queue *que = adapter->queues;
5280 1.14.2.5 riz u32 mask, fwsm;
5281 1.1 dyoung
5282 1.14.2.5 riz mask = (IXGBE_EIMS_ENABLE_MASK & ~IXGBE_EIMS_RTX_QUEUE);
5283 1.1 dyoung /* Enable Fan Failure detection */
5284 1.1 dyoung if (hw->device_id == IXGBE_DEV_ID_82598AT)
5285 1.1 dyoung mask |= IXGBE_EIMS_GPI_SDP1;
5286 1.14.2.5 riz
5287 1.14.2.5 riz switch (adapter->hw.mac.type) {
5288 1.14.2.5 riz case ixgbe_mac_82599EB:
5289 1.14.2.5 riz mask |= IXGBE_EIMS_ECC;
5290 1.14.2.5 riz mask |= IXGBE_EIMS_GPI_SDP0;
5291 1.14.2.5 riz mask |= IXGBE_EIMS_GPI_SDP1;
5292 1.14.2.5 riz mask |= IXGBE_EIMS_GPI_SDP2;
5293 1.1 dyoung #ifdef IXGBE_FDIR
5294 1.14.2.5 riz mask |= IXGBE_EIMS_FLOW_DIR;
5295 1.1 dyoung #endif
5296 1.14.2.5 riz break;
5297 1.14.2.5 riz case ixgbe_mac_X540:
5298 1.14.2.5 riz mask |= IXGBE_EIMS_ECC;
5299 1.14.2.5 riz /* Detect if Thermal Sensor is enabled */
5300 1.14.2.5 riz fwsm = IXGBE_READ_REG(hw, IXGBE_FWSM);
5301 1.14.2.5 riz if (fwsm & IXGBE_FWSM_TS_ENABLED)
5302 1.14.2.5 riz mask |= IXGBE_EIMS_TS;
5303 1.14.2.5 riz #ifdef IXGBE_FDIR
5304 1.14.2.5 riz mask |= IXGBE_EIMS_FLOW_DIR;
5305 1.14.2.5 riz #endif
5306 1.14.2.5 riz /* falls through */
5307 1.14.2.5 riz default:
5308 1.14.2.5 riz break;
5309 1.1 dyoung }
5310 1.1 dyoung
5311 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EIMS, mask);
5312 1.1 dyoung
5313 1.1 dyoung /* With RSS we use auto clear */
5314 1.1 dyoung if (adapter->msix_mem) {
5315 1.1 dyoung mask = IXGBE_EIMS_ENABLE_MASK;
5316 1.1 dyoung /* Don't autoclear Link */
5317 1.1 dyoung mask &= ~IXGBE_EIMS_OTHER;
5318 1.1 dyoung mask &= ~IXGBE_EIMS_LSC;
5319 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EIAC, mask);
5320 1.1 dyoung }
5321 1.1 dyoung
5322 1.1 dyoung /*
5323 1.1 dyoung ** Now enable all queues, this is done separately to
5324 1.1 dyoung ** allow for handling the extended (beyond 32) MSIX
5325 1.1 dyoung ** vectors that can be used by 82599
5326 1.1 dyoung */
5327 1.1 dyoung for (int i = 0; i < adapter->num_queues; i++, que++)
5328 1.1 dyoung ixgbe_enable_queue(adapter, que->msix);
5329 1.1 dyoung
5330 1.1 dyoung IXGBE_WRITE_FLUSH(hw);
5331 1.1 dyoung
5332 1.1 dyoung return;
5333 1.1 dyoung }
5334 1.1 dyoung
5335 1.1 dyoung static void
5336 1.1 dyoung ixgbe_disable_intr(struct adapter *adapter)
5337 1.1 dyoung {
5338 1.1 dyoung if (adapter->msix_mem)
5339 1.1 dyoung IXGBE_WRITE_REG(&adapter->hw, IXGBE_EIAC, 0);
5340 1.1 dyoung if (adapter->hw.mac.type == ixgbe_mac_82598EB) {
5341 1.1 dyoung IXGBE_WRITE_REG(&adapter->hw, IXGBE_EIMC, ~0);
5342 1.1 dyoung } else {
5343 1.1 dyoung IXGBE_WRITE_REG(&adapter->hw, IXGBE_EIMC, 0xFFFF0000);
5344 1.1 dyoung IXGBE_WRITE_REG(&adapter->hw, IXGBE_EIMC_EX(0), ~0);
5345 1.1 dyoung IXGBE_WRITE_REG(&adapter->hw, IXGBE_EIMC_EX(1), ~0);
5346 1.1 dyoung }
5347 1.1 dyoung IXGBE_WRITE_FLUSH(&adapter->hw);
5348 1.1 dyoung return;
5349 1.1 dyoung }
5350 1.1 dyoung
5351 1.1 dyoung u16
5352 1.1 dyoung ixgbe_read_pci_cfg(struct ixgbe_hw *hw, u32 reg)
5353 1.1 dyoung {
5354 1.1 dyoung switch (reg % 4) {
5355 1.1 dyoung case 0:
5356 1.1 dyoung return pci_conf_read(hw->back->pc, hw->back->tag, reg) &
5357 1.1 dyoung __BITS(15, 0);
5358 1.1 dyoung case 2:
5359 1.1 dyoung return __SHIFTOUT(pci_conf_read(hw->back->pc, hw->back->tag,
5360 1.1 dyoung reg - 2), __BITS(31, 16));
5361 1.1 dyoung default:
5362 1.1 dyoung panic("%s: invalid register (%" PRIx32, __func__, reg);
5363 1.1 dyoung break;
5364 1.1 dyoung }
5365 1.1 dyoung }
5366 1.1 dyoung
5367 1.1 dyoung void
5368 1.1 dyoung ixgbe_write_pci_cfg(struct ixgbe_hw *hw, u32 reg, u16 value)
5369 1.1 dyoung {
5370 1.1 dyoung pcireg_t old;
5371 1.1 dyoung
5372 1.1 dyoung switch (reg % 4) {
5373 1.1 dyoung case 0:
5374 1.1 dyoung old = pci_conf_read(hw->back->pc, hw->back->tag, reg) &
5375 1.1 dyoung __BITS(31, 16);
5376 1.1 dyoung pci_conf_write(hw->back->pc, hw->back->tag, reg, value | old);
5377 1.1 dyoung break;
5378 1.1 dyoung case 2:
5379 1.1 dyoung old = pci_conf_read(hw->back->pc, hw->back->tag, reg - 2) &
5380 1.1 dyoung __BITS(15, 0);
5381 1.1 dyoung pci_conf_write(hw->back->pc, hw->back->tag, reg - 2,
5382 1.1 dyoung __SHIFTIN(value, __BITS(31, 16)) | old);
5383 1.1 dyoung break;
5384 1.1 dyoung default:
5385 1.1 dyoung panic("%s: invalid register (%" PRIx32, __func__, reg);
5386 1.1 dyoung break;
5387 1.1 dyoung }
5388 1.1 dyoung
5389 1.1 dyoung return;
5390 1.1 dyoung }
5391 1.1 dyoung
5392 1.1 dyoung /*
5393 1.14.2.6 snj ** Get the width and transaction speed of
5394 1.14.2.6 snj ** the slot this adapter is plugged into.
5395 1.14.2.6 snj */
5396 1.14.2.6 snj static void
5397 1.14.2.6 snj ixgbe_get_slot_info(struct ixgbe_hw *hw)
5398 1.14.2.6 snj {
5399 1.14.2.6 snj device_t dev = ((struct ixgbe_osdep *)hw->back)->dev;
5400 1.14.2.6 snj struct ixgbe_mac_info *mac = &hw->mac;
5401 1.14.2.6 snj u16 link;
5402 1.14.2.6 snj
5403 1.14.2.6 snj /* For most devices simply call the shared code routine */
5404 1.14.2.6 snj if (hw->device_id != IXGBE_DEV_ID_82599_SFP_SF_QP) {
5405 1.14.2.6 snj ixgbe_get_bus_info(hw);
5406 1.14.2.6 snj goto display;
5407 1.14.2.6 snj }
5408 1.14.2.6 snj
5409 1.14.2.6 snj /*
5410 1.14.2.6 snj ** For the Quad port adapter we need to parse back
5411 1.14.2.6 snj ** up the PCI tree to find the speed of the expansion
5412 1.14.2.6 snj ** slot into which this adapter is plugged. A bit more work.
5413 1.14.2.6 snj */
5414 1.14.2.6 snj dev = device_parent(device_parent(dev));
5415 1.14.2.6 snj #ifdef IXGBE_DEBUG
5416 1.14.2.6 snj device_printf(dev, "parent pcib = %x,%x,%x\n",
5417 1.14.2.6 snj pci_get_bus(dev), pci_get_slot(dev), pci_get_function(dev));
5418 1.14.2.6 snj #endif
5419 1.14.2.6 snj dev = device_parent(device_parent(dev));
5420 1.14.2.6 snj #ifdef IXGBE_DEBUG
5421 1.14.2.6 snj device_printf(dev, "slot pcib = %x,%x,%x\n",
5422 1.14.2.6 snj pci_get_bus(dev), pci_get_slot(dev), pci_get_function(dev));
5423 1.14.2.6 snj #endif
5424 1.14.2.6 snj /* Now get the PCI Express Capabilities offset */
5425 1.14.2.6 snj /* ...and read the Link Status Register */
5426 1.14.2.6 snj link = IXGBE_READ_PCIE_WORD(hw, IXGBE_PCI_LINK_STATUS);
5427 1.14.2.6 snj switch (link & IXGBE_PCI_LINK_WIDTH) {
5428 1.14.2.6 snj case IXGBE_PCI_LINK_WIDTH_1:
5429 1.14.2.6 snj hw->bus.width = ixgbe_bus_width_pcie_x1;
5430 1.14.2.6 snj break;
5431 1.14.2.6 snj case IXGBE_PCI_LINK_WIDTH_2:
5432 1.14.2.6 snj hw->bus.width = ixgbe_bus_width_pcie_x2;
5433 1.14.2.6 snj break;
5434 1.14.2.6 snj case IXGBE_PCI_LINK_WIDTH_4:
5435 1.14.2.6 snj hw->bus.width = ixgbe_bus_width_pcie_x4;
5436 1.14.2.6 snj break;
5437 1.14.2.6 snj case IXGBE_PCI_LINK_WIDTH_8:
5438 1.14.2.6 snj hw->bus.width = ixgbe_bus_width_pcie_x8;
5439 1.14.2.6 snj break;
5440 1.14.2.6 snj default:
5441 1.14.2.6 snj hw->bus.width = ixgbe_bus_width_unknown;
5442 1.14.2.6 snj break;
5443 1.14.2.6 snj }
5444 1.14.2.6 snj
5445 1.14.2.6 snj switch (link & IXGBE_PCI_LINK_SPEED) {
5446 1.14.2.6 snj case IXGBE_PCI_LINK_SPEED_2500:
5447 1.14.2.6 snj hw->bus.speed = ixgbe_bus_speed_2500;
5448 1.14.2.6 snj break;
5449 1.14.2.6 snj case IXGBE_PCI_LINK_SPEED_5000:
5450 1.14.2.6 snj hw->bus.speed = ixgbe_bus_speed_5000;
5451 1.14.2.6 snj break;
5452 1.14.2.6 snj case IXGBE_PCI_LINK_SPEED_8000:
5453 1.14.2.6 snj hw->bus.speed = ixgbe_bus_speed_8000;
5454 1.14.2.6 snj break;
5455 1.14.2.6 snj default:
5456 1.14.2.6 snj hw->bus.speed = ixgbe_bus_speed_unknown;
5457 1.14.2.6 snj break;
5458 1.14.2.6 snj }
5459 1.14.2.6 snj
5460 1.14.2.6 snj mac->ops.set_lan_id(hw);
5461 1.14.2.6 snj
5462 1.14.2.6 snj display:
5463 1.14.2.6 snj device_printf(dev,"PCI Express Bus: Speed %s %s\n",
5464 1.14.2.6 snj ((hw->bus.speed == ixgbe_bus_speed_8000) ? "8.0GT/s":
5465 1.14.2.6 snj (hw->bus.speed == ixgbe_bus_speed_5000) ? "5.0GT/s":
5466 1.14.2.6 snj (hw->bus.speed == ixgbe_bus_speed_2500) ? "2.5GT/s":"Unknown"),
5467 1.14.2.6 snj (hw->bus.width == ixgbe_bus_width_pcie_x8) ? "Width x8" :
5468 1.14.2.6 snj (hw->bus.width == ixgbe_bus_width_pcie_x4) ? "Width x4" :
5469 1.14.2.6 snj (hw->bus.width == ixgbe_bus_width_pcie_x1) ? "Width x1" :
5470 1.14.2.6 snj ("Unknown"));
5471 1.14.2.6 snj
5472 1.14.2.6 snj if ((hw->device_id != IXGBE_DEV_ID_82599_SFP_SF_QP) &&
5473 1.14.2.6 snj ((hw->bus.width <= ixgbe_bus_width_pcie_x4) &&
5474 1.14.2.6 snj (hw->bus.speed == ixgbe_bus_speed_2500))) {
5475 1.14.2.6 snj device_printf(dev, "PCI-Express bandwidth available"
5476 1.14.2.6 snj " for this card\n is not sufficient for"
5477 1.14.2.6 snj " optimal performance.\n");
5478 1.14.2.6 snj device_printf(dev, "For optimal performance a x8 "
5479 1.14.2.6 snj "PCIE, or x4 PCIE Gen2 slot is required.\n");
5480 1.14.2.6 snj }
5481 1.14.2.6 snj if ((hw->device_id == IXGBE_DEV_ID_82599_SFP_SF_QP) &&
5482 1.14.2.6 snj ((hw->bus.width <= ixgbe_bus_width_pcie_x8) &&
5483 1.14.2.6 snj (hw->bus.speed < ixgbe_bus_speed_8000))) {
5484 1.14.2.6 snj device_printf(dev, "PCI-Express bandwidth available"
5485 1.14.2.6 snj " for this card\n is not sufficient for"
5486 1.14.2.6 snj " optimal performance.\n");
5487 1.14.2.6 snj device_printf(dev, "For optimal performance a x8 "
5488 1.14.2.6 snj "PCIE Gen3 slot is required.\n");
5489 1.14.2.6 snj }
5490 1.14.2.6 snj
5491 1.14.2.6 snj return;
5492 1.14.2.6 snj }
5493 1.14.2.6 snj
5494 1.14.2.6 snj
5495 1.14.2.6 snj /*
5496 1.1 dyoung ** Setup the correct IVAR register for a particular MSIX interrupt
5497 1.1 dyoung ** (yes this is all very magic and confusing :)
5498 1.1 dyoung ** - entry is the register array entry
5499 1.1 dyoung ** - vector is the MSIX vector for this queue
5500 1.1 dyoung ** - type is RX/TX/MISC
5501 1.1 dyoung */
5502 1.1 dyoung static void
5503 1.1 dyoung ixgbe_set_ivar(struct adapter *adapter, u8 entry, u8 vector, s8 type)
5504 1.1 dyoung {
5505 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
5506 1.1 dyoung u32 ivar, index;
5507 1.1 dyoung
5508 1.1 dyoung vector |= IXGBE_IVAR_ALLOC_VAL;
5509 1.1 dyoung
5510 1.1 dyoung switch (hw->mac.type) {
5511 1.1 dyoung
5512 1.1 dyoung case ixgbe_mac_82598EB:
5513 1.1 dyoung if (type == -1)
5514 1.1 dyoung entry = IXGBE_IVAR_OTHER_CAUSES_INDEX;
5515 1.1 dyoung else
5516 1.1 dyoung entry += (type * 64);
5517 1.1 dyoung index = (entry >> 2) & 0x1F;
5518 1.1 dyoung ivar = IXGBE_READ_REG(hw, IXGBE_IVAR(index));
5519 1.1 dyoung ivar &= ~(0xFF << (8 * (entry & 0x3)));
5520 1.1 dyoung ivar |= (vector << (8 * (entry & 0x3)));
5521 1.1 dyoung IXGBE_WRITE_REG(&adapter->hw, IXGBE_IVAR(index), ivar);
5522 1.1 dyoung break;
5523 1.1 dyoung
5524 1.1 dyoung case ixgbe_mac_82599EB:
5525 1.14.2.4 riz case ixgbe_mac_X540:
5526 1.1 dyoung if (type == -1) { /* MISC IVAR */
5527 1.1 dyoung index = (entry & 1) * 8;
5528 1.1 dyoung ivar = IXGBE_READ_REG(hw, IXGBE_IVAR_MISC);
5529 1.1 dyoung ivar &= ~(0xFF << index);
5530 1.1 dyoung ivar |= (vector << index);
5531 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_IVAR_MISC, ivar);
5532 1.1 dyoung } else { /* RX/TX IVARS */
5533 1.1 dyoung index = (16 * (entry & 1)) + (8 * type);
5534 1.1 dyoung ivar = IXGBE_READ_REG(hw, IXGBE_IVAR(entry >> 1));
5535 1.1 dyoung ivar &= ~(0xFF << index);
5536 1.1 dyoung ivar |= (vector << index);
5537 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_IVAR(entry >> 1), ivar);
5538 1.1 dyoung }
5539 1.1 dyoung
5540 1.1 dyoung default:
5541 1.1 dyoung break;
5542 1.1 dyoung }
5543 1.1 dyoung }
5544 1.1 dyoung
5545 1.1 dyoung static void
5546 1.1 dyoung ixgbe_configure_ivars(struct adapter *adapter)
5547 1.1 dyoung {
5548 1.1 dyoung struct ix_queue *que = adapter->queues;
5549 1.1 dyoung u32 newitr;
5550 1.1 dyoung
5551 1.1 dyoung if (ixgbe_max_interrupt_rate > 0)
5552 1.14.2.3 martin newitr = (4000000 / ixgbe_max_interrupt_rate) & 0x0FF8;
5553 1.1 dyoung else
5554 1.1 dyoung newitr = 0;
5555 1.1 dyoung
5556 1.1 dyoung for (int i = 0; i < adapter->num_queues; i++, que++) {
5557 1.1 dyoung /* First the RX queue entry */
5558 1.1 dyoung ixgbe_set_ivar(adapter, i, que->msix, 0);
5559 1.1 dyoung /* ... and the TX */
5560 1.1 dyoung ixgbe_set_ivar(adapter, i, que->msix, 1);
5561 1.1 dyoung /* Set an Initial EITR value */
5562 1.1 dyoung IXGBE_WRITE_REG(&adapter->hw,
5563 1.1 dyoung IXGBE_EITR(que->msix), newitr);
5564 1.1 dyoung }
5565 1.1 dyoung
5566 1.1 dyoung /* For the Link interrupt */
5567 1.1 dyoung ixgbe_set_ivar(adapter, 1, adapter->linkvec, -1);
5568 1.1 dyoung }
5569 1.1 dyoung
5570 1.1 dyoung /*
5571 1.1 dyoung ** ixgbe_sfp_probe - called in the local timer to
5572 1.1 dyoung ** determine if a port had optics inserted.
5573 1.1 dyoung */
5574 1.1 dyoung static bool ixgbe_sfp_probe(struct adapter *adapter)
5575 1.1 dyoung {
5576 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
5577 1.1 dyoung device_t dev = adapter->dev;
5578 1.1 dyoung bool result = FALSE;
5579 1.1 dyoung
5580 1.1 dyoung if ((hw->phy.type == ixgbe_phy_nl) &&
5581 1.1 dyoung (hw->phy.sfp_type == ixgbe_sfp_type_not_present)) {
5582 1.1 dyoung s32 ret = hw->phy.ops.identify_sfp(hw);
5583 1.1 dyoung if (ret)
5584 1.1 dyoung goto out;
5585 1.1 dyoung ret = hw->phy.ops.reset(hw);
5586 1.1 dyoung if (ret == IXGBE_ERR_SFP_NOT_SUPPORTED) {
5587 1.1 dyoung device_printf(dev,"Unsupported SFP+ module detected!");
5588 1.1 dyoung device_printf(dev, "Reload driver with supported module.\n");
5589 1.1 dyoung adapter->sfp_probe = FALSE;
5590 1.1 dyoung goto out;
5591 1.1 dyoung } else
5592 1.1 dyoung device_printf(dev,"SFP+ module detected!\n");
5593 1.1 dyoung /* We now have supported optics */
5594 1.1 dyoung adapter->sfp_probe = FALSE;
5595 1.1 dyoung /* Set the optics type so system reports correctly */
5596 1.1 dyoung ixgbe_setup_optics(adapter);
5597 1.1 dyoung result = TRUE;
5598 1.1 dyoung }
5599 1.1 dyoung out:
5600 1.1 dyoung return (result);
5601 1.1 dyoung }
5602 1.1 dyoung
5603 1.1 dyoung /*
5604 1.1 dyoung ** Tasklet handler for MSIX Link interrupts
5605 1.1 dyoung ** - do outside interrupt since it might sleep
5606 1.1 dyoung */
5607 1.1 dyoung static void
5608 1.1 dyoung ixgbe_handle_link(void *context)
5609 1.1 dyoung {
5610 1.1 dyoung struct adapter *adapter = context;
5611 1.1 dyoung
5612 1.13 christos if (ixgbe_check_link(&adapter->hw,
5613 1.13 christos &adapter->link_speed, &adapter->link_up, 0) == 0)
5614 1.13 christos ixgbe_update_link_status(adapter);
5615 1.1 dyoung }
5616 1.1 dyoung
5617 1.1 dyoung /*
5618 1.1 dyoung ** Tasklet for handling SFP module interrupts
5619 1.1 dyoung */
5620 1.1 dyoung static void
5621 1.1 dyoung ixgbe_handle_mod(void *context)
5622 1.1 dyoung {
5623 1.1 dyoung struct adapter *adapter = context;
5624 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
5625 1.1 dyoung device_t dev = adapter->dev;
5626 1.1 dyoung u32 err;
5627 1.1 dyoung
5628 1.1 dyoung err = hw->phy.ops.identify_sfp(hw);
5629 1.1 dyoung if (err == IXGBE_ERR_SFP_NOT_SUPPORTED) {
5630 1.1 dyoung device_printf(dev,
5631 1.1 dyoung "Unsupported SFP+ module type was detected.\n");
5632 1.1 dyoung return;
5633 1.1 dyoung }
5634 1.1 dyoung err = hw->mac.ops.setup_sfp(hw);
5635 1.1 dyoung if (err == IXGBE_ERR_SFP_NOT_SUPPORTED) {
5636 1.1 dyoung device_printf(dev,
5637 1.1 dyoung "Setup failure - unsupported SFP+ module type.\n");
5638 1.1 dyoung return;
5639 1.1 dyoung }
5640 1.1 dyoung softint_schedule(adapter->msf_si);
5641 1.1 dyoung return;
5642 1.1 dyoung }
5643 1.1 dyoung
5644 1.1 dyoung
5645 1.1 dyoung /*
5646 1.1 dyoung ** Tasklet for handling MSF (multispeed fiber) interrupts
5647 1.1 dyoung */
5648 1.1 dyoung static void
5649 1.1 dyoung ixgbe_handle_msf(void *context)
5650 1.1 dyoung {
5651 1.1 dyoung struct adapter *adapter = context;
5652 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
5653 1.1 dyoung u32 autoneg;
5654 1.1 dyoung bool negotiate;
5655 1.1 dyoung
5656 1.1 dyoung autoneg = hw->phy.autoneg_advertised;
5657 1.1 dyoung if ((!autoneg) && (hw->mac.ops.get_link_capabilities))
5658 1.1 dyoung hw->mac.ops.get_link_capabilities(hw, &autoneg, &negotiate);
5659 1.13 christos else
5660 1.13 christos negotiate = 0;
5661 1.1 dyoung if (hw->mac.ops.setup_link)
5662 1.14.2.5 riz hw->mac.ops.setup_link(hw, autoneg, TRUE);
5663 1.1 dyoung return;
5664 1.1 dyoung }
5665 1.1 dyoung
5666 1.1 dyoung #ifdef IXGBE_FDIR
5667 1.1 dyoung /*
5668 1.1 dyoung ** Tasklet for reinitializing the Flow Director filter table
5669 1.1 dyoung */
5670 1.1 dyoung static void
5671 1.1 dyoung ixgbe_reinit_fdir(void *context)
5672 1.1 dyoung {
5673 1.1 dyoung struct adapter *adapter = context;
5674 1.1 dyoung struct ifnet *ifp = adapter->ifp;
5675 1.1 dyoung
5676 1.1 dyoung if (adapter->fdir_reinit != 1) /* Shouldn't happen */
5677 1.1 dyoung return;
5678 1.1 dyoung ixgbe_reinit_fdir_tables_82599(&adapter->hw);
5679 1.1 dyoung adapter->fdir_reinit = 0;
5680 1.14.2.4 riz /* re-enable flow director interrupts */
5681 1.14.2.4 riz IXGBE_WRITE_REG(&adapter->hw, IXGBE_EIMS, IXGBE_EIMS_FLOW_DIR);
5682 1.1 dyoung /* Restart the interface */
5683 1.1 dyoung ifp->if_flags |= IFF_RUNNING;
5684 1.1 dyoung return;
5685 1.1 dyoung }
5686 1.1 dyoung #endif
5687 1.1 dyoung
5688 1.1 dyoung /**********************************************************************
5689 1.1 dyoung *
5690 1.1 dyoung * Update the board statistics counters.
5691 1.1 dyoung *
5692 1.1 dyoung **********************************************************************/
5693 1.1 dyoung static void
5694 1.1 dyoung ixgbe_update_stats_counters(struct adapter *adapter)
5695 1.1 dyoung {
5696 1.1 dyoung struct ifnet *ifp = adapter->ifp;
5697 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
5698 1.1 dyoung u32 missed_rx = 0, bprc, lxon, lxoff, total;
5699 1.1 dyoung u64 total_missed_rx = 0;
5700 1.14.2.4 riz uint64_t crcerrs, rlec;
5701 1.1 dyoung
5702 1.14.2.4 riz crcerrs = IXGBE_READ_REG(hw, IXGBE_CRCERRS);
5703 1.14.2.4 riz adapter->stats.crcerrs.ev_count += crcerrs;
5704 1.1 dyoung adapter->stats.illerrc.ev_count += IXGBE_READ_REG(hw, IXGBE_ILLERRC);
5705 1.1 dyoung adapter->stats.errbc.ev_count += IXGBE_READ_REG(hw, IXGBE_ERRBC);
5706 1.1 dyoung adapter->stats.mspdc.ev_count += IXGBE_READ_REG(hw, IXGBE_MSPDC);
5707 1.1 dyoung
5708 1.14.2.5 riz /*
5709 1.14.2.5 riz ** Note: these are for the 8 possible traffic classes,
5710 1.14.2.5 riz ** which in current implementation is unused,
5711 1.14.2.5 riz ** therefore only 0 should read real data.
5712 1.14.2.5 riz */
5713 1.1 dyoung for (int i = 0; i < __arraycount(adapter->stats.mpc); i++) {
5714 1.1 dyoung int j = i % adapter->num_queues;
5715 1.1 dyoung u32 mp;
5716 1.1 dyoung mp = IXGBE_READ_REG(hw, IXGBE_MPC(i));
5717 1.1 dyoung /* missed_rx tallies misses for the gprc workaround */
5718 1.1 dyoung missed_rx += mp;
5719 1.1 dyoung /* global total per queue */
5720 1.1 dyoung adapter->stats.mpc[j].ev_count += mp;
5721 1.1 dyoung /* Running comprehensive total for stats display */
5722 1.14.2.4 riz total_missed_rx += mp;
5723 1.14.2.5 riz if (hw->mac.type == ixgbe_mac_82598EB) {
5724 1.1 dyoung adapter->stats.rnbc[j] +=
5725 1.1 dyoung IXGBE_READ_REG(hw, IXGBE_RNBC(i));
5726 1.14.2.5 riz adapter->stats.qbtc[j].ev_count +=
5727 1.14.2.5 riz IXGBE_READ_REG(hw, IXGBE_QBTC(i));
5728 1.14.2.5 riz adapter->stats.qbrc[j].ev_count +=
5729 1.14.2.5 riz IXGBE_READ_REG(hw, IXGBE_QBRC(i));
5730 1.14.2.5 riz adapter->stats.pxonrxc[j].ev_count +=
5731 1.14.2.5 riz IXGBE_READ_REG(hw, IXGBE_PXONRXC(i));
5732 1.14.2.5 riz } else {
5733 1.14.2.5 riz adapter->stats.pxonrxc[j].ev_count +=
5734 1.14.2.5 riz IXGBE_READ_REG(hw, IXGBE_PXONRXCNT(i));
5735 1.14.2.5 riz }
5736 1.1 dyoung adapter->stats.pxontxc[j].ev_count +=
5737 1.1 dyoung IXGBE_READ_REG(hw, IXGBE_PXONTXC(i));
5738 1.1 dyoung adapter->stats.pxofftxc[j].ev_count +=
5739 1.1 dyoung IXGBE_READ_REG(hw, IXGBE_PXOFFTXC(i));
5740 1.1 dyoung adapter->stats.pxoffrxc[j].ev_count +=
5741 1.1 dyoung IXGBE_READ_REG(hw, IXGBE_PXOFFRXC(i));
5742 1.1 dyoung adapter->stats.pxon2offc[j].ev_count +=
5743 1.1 dyoung IXGBE_READ_REG(hw, IXGBE_PXON2OFFCNT(i));
5744 1.1 dyoung }
5745 1.1 dyoung for (int i = 0; i < __arraycount(adapter->stats.qprc); i++) {
5746 1.1 dyoung int j = i % adapter->num_queues;
5747 1.1 dyoung adapter->stats.qprc[j].ev_count += IXGBE_READ_REG(hw, IXGBE_QPRC(i));
5748 1.1 dyoung adapter->stats.qptc[j].ev_count += IXGBE_READ_REG(hw, IXGBE_QPTC(i));
5749 1.1 dyoung adapter->stats.qprdc[j].ev_count += IXGBE_READ_REG(hw, IXGBE_QPRDC(i));
5750 1.1 dyoung }
5751 1.1 dyoung adapter->stats.mlfc.ev_count += IXGBE_READ_REG(hw, IXGBE_MLFC);
5752 1.1 dyoung adapter->stats.mrfc.ev_count += IXGBE_READ_REG(hw, IXGBE_MRFC);
5753 1.14.2.4 riz rlec = IXGBE_READ_REG(hw, IXGBE_RLEC);
5754 1.14.2.4 riz adapter->stats.rlec.ev_count += rlec;
5755 1.1 dyoung
5756 1.1 dyoung /* Hardware workaround, gprc counts missed packets */
5757 1.1 dyoung adapter->stats.gprc.ev_count += IXGBE_READ_REG(hw, IXGBE_GPRC) - missed_rx;
5758 1.1 dyoung
5759 1.1 dyoung lxon = IXGBE_READ_REG(hw, IXGBE_LXONTXC);
5760 1.1 dyoung adapter->stats.lxontxc.ev_count += lxon;
5761 1.1 dyoung lxoff = IXGBE_READ_REG(hw, IXGBE_LXOFFTXC);
5762 1.1 dyoung adapter->stats.lxofftxc.ev_count += lxoff;
5763 1.1 dyoung total = lxon + lxoff;
5764 1.1 dyoung
5765 1.1 dyoung if (hw->mac.type != ixgbe_mac_82598EB) {
5766 1.1 dyoung adapter->stats.gorc.ev_count += IXGBE_READ_REG(hw, IXGBE_GORCL) +
5767 1.1 dyoung ((u64)IXGBE_READ_REG(hw, IXGBE_GORCH) << 32);
5768 1.1 dyoung adapter->stats.gotc.ev_count += IXGBE_READ_REG(hw, IXGBE_GOTCL) +
5769 1.1 dyoung ((u64)IXGBE_READ_REG(hw, IXGBE_GOTCH) << 32) - total * ETHER_MIN_LEN;
5770 1.1 dyoung adapter->stats.tor.ev_count += IXGBE_READ_REG(hw, IXGBE_TORL) +
5771 1.1 dyoung ((u64)IXGBE_READ_REG(hw, IXGBE_TORH) << 32);
5772 1.1 dyoung adapter->stats.lxonrxc.ev_count += IXGBE_READ_REG(hw, IXGBE_LXONRXCNT);
5773 1.1 dyoung adapter->stats.lxoffrxc.ev_count += IXGBE_READ_REG(hw, IXGBE_LXOFFRXCNT);
5774 1.1 dyoung } else {
5775 1.1 dyoung adapter->stats.lxonrxc.ev_count += IXGBE_READ_REG(hw, IXGBE_LXONRXC);
5776 1.1 dyoung adapter->stats.lxoffrxc.ev_count += IXGBE_READ_REG(hw, IXGBE_LXOFFRXC);
5777 1.1 dyoung /* 82598 only has a counter in the high register */
5778 1.1 dyoung adapter->stats.gorc.ev_count += IXGBE_READ_REG(hw, IXGBE_GORCH);
5779 1.1 dyoung adapter->stats.gotc.ev_count += IXGBE_READ_REG(hw, IXGBE_GOTCH) - total * ETHER_MIN_LEN;
5780 1.1 dyoung adapter->stats.tor.ev_count += IXGBE_READ_REG(hw, IXGBE_TORH);
5781 1.1 dyoung }
5782 1.1 dyoung
5783 1.1 dyoung /*
5784 1.1 dyoung * Workaround: mprc hardware is incorrectly counting
5785 1.1 dyoung * broadcasts, so for now we subtract those.
5786 1.1 dyoung */
5787 1.1 dyoung bprc = IXGBE_READ_REG(hw, IXGBE_BPRC);
5788 1.1 dyoung adapter->stats.bprc.ev_count += bprc;
5789 1.1 dyoung adapter->stats.mprc.ev_count += IXGBE_READ_REG(hw, IXGBE_MPRC) - ((hw->mac.type == ixgbe_mac_82598EB) ? bprc : 0);
5790 1.1 dyoung
5791 1.1 dyoung adapter->stats.prc64.ev_count += IXGBE_READ_REG(hw, IXGBE_PRC64);
5792 1.1 dyoung adapter->stats.prc127.ev_count += IXGBE_READ_REG(hw, IXGBE_PRC127);
5793 1.1 dyoung adapter->stats.prc255.ev_count += IXGBE_READ_REG(hw, IXGBE_PRC255);
5794 1.1 dyoung adapter->stats.prc511.ev_count += IXGBE_READ_REG(hw, IXGBE_PRC511);
5795 1.1 dyoung adapter->stats.prc1023.ev_count += IXGBE_READ_REG(hw, IXGBE_PRC1023);
5796 1.1 dyoung adapter->stats.prc1522.ev_count += IXGBE_READ_REG(hw, IXGBE_PRC1522);
5797 1.1 dyoung
5798 1.1 dyoung adapter->stats.gptc.ev_count += IXGBE_READ_REG(hw, IXGBE_GPTC) - total;
5799 1.1 dyoung adapter->stats.mptc.ev_count += IXGBE_READ_REG(hw, IXGBE_MPTC) - total;
5800 1.1 dyoung adapter->stats.ptc64.ev_count += IXGBE_READ_REG(hw, IXGBE_PTC64) - total;
5801 1.1 dyoung
5802 1.1 dyoung adapter->stats.ruc.ev_count += IXGBE_READ_REG(hw, IXGBE_RUC);
5803 1.1 dyoung adapter->stats.rfc.ev_count += IXGBE_READ_REG(hw, IXGBE_RFC);
5804 1.1 dyoung adapter->stats.roc.ev_count += IXGBE_READ_REG(hw, IXGBE_ROC);
5805 1.1 dyoung adapter->stats.rjc.ev_count += IXGBE_READ_REG(hw, IXGBE_RJC);
5806 1.1 dyoung adapter->stats.mngprc.ev_count += IXGBE_READ_REG(hw, IXGBE_MNGPRC);
5807 1.1 dyoung adapter->stats.mngpdc.ev_count += IXGBE_READ_REG(hw, IXGBE_MNGPDC);
5808 1.1 dyoung adapter->stats.mngptc.ev_count += IXGBE_READ_REG(hw, IXGBE_MNGPTC);
5809 1.1 dyoung adapter->stats.tpr.ev_count += IXGBE_READ_REG(hw, IXGBE_TPR);
5810 1.1 dyoung adapter->stats.tpt.ev_count += IXGBE_READ_REG(hw, IXGBE_TPT);
5811 1.1 dyoung adapter->stats.ptc127.ev_count += IXGBE_READ_REG(hw, IXGBE_PTC127);
5812 1.1 dyoung adapter->stats.ptc255.ev_count += IXGBE_READ_REG(hw, IXGBE_PTC255);
5813 1.1 dyoung adapter->stats.ptc511.ev_count += IXGBE_READ_REG(hw, IXGBE_PTC511);
5814 1.1 dyoung adapter->stats.ptc1023.ev_count += IXGBE_READ_REG(hw, IXGBE_PTC1023);
5815 1.1 dyoung adapter->stats.ptc1522.ev_count += IXGBE_READ_REG(hw, IXGBE_PTC1522);
5816 1.1 dyoung adapter->stats.bptc.ev_count += IXGBE_READ_REG(hw, IXGBE_BPTC);
5817 1.1 dyoung adapter->stats.xec.ev_count += IXGBE_READ_REG(hw, IXGBE_XEC);
5818 1.1 dyoung adapter->stats.fccrc.ev_count += IXGBE_READ_REG(hw, IXGBE_FCCRC);
5819 1.1 dyoung adapter->stats.fclast.ev_count += IXGBE_READ_REG(hw, IXGBE_FCLAST);
5820 1.1 dyoung
5821 1.1 dyoung /* Only read FCOE on 82599 */
5822 1.1 dyoung if (hw->mac.type != ixgbe_mac_82598EB) {
5823 1.1 dyoung adapter->stats.fcoerpdc.ev_count +=
5824 1.1 dyoung IXGBE_READ_REG(hw, IXGBE_FCOERPDC);
5825 1.1 dyoung adapter->stats.fcoeprc.ev_count +=
5826 1.1 dyoung IXGBE_READ_REG(hw, IXGBE_FCOEPRC);
5827 1.1 dyoung adapter->stats.fcoeptc.ev_count +=
5828 1.1 dyoung IXGBE_READ_REG(hw, IXGBE_FCOEPTC);
5829 1.1 dyoung adapter->stats.fcoedwrc.ev_count +=
5830 1.1 dyoung IXGBE_READ_REG(hw, IXGBE_FCOEDWRC);
5831 1.1 dyoung adapter->stats.fcoedwtc.ev_count +=
5832 1.1 dyoung IXGBE_READ_REG(hw, IXGBE_FCOEDWTC);
5833 1.1 dyoung }
5834 1.1 dyoung
5835 1.1 dyoung /* Fill out the OS statistics structure */
5836 1.14.2.4 riz /*
5837 1.14.2.4 riz * NetBSD: Don't override if_{i|o}{packets|bytes|mcasts} with
5838 1.14.2.4 riz * adapter->stats counters. It's required to make ifconfig -z
5839 1.14.2.4 riz * (SOICZIFDATA) work.
5840 1.14.2.4 riz */
5841 1.1 dyoung ifp->if_collisions = 0;
5842 1.14.2.5 riz
5843 1.1 dyoung /* Rx Errors */
5844 1.14.2.5 riz ifp->if_iqdrops += total_missed_rx;
5845 1.14.2.5 riz ifp->if_ierrors += crcerrs + rlec;
5846 1.1 dyoung }
5847 1.1 dyoung
5848 1.1 dyoung /** ixgbe_sysctl_tdh_handler - Handler function
5849 1.1 dyoung * Retrieves the TDH value from the hardware
5850 1.1 dyoung */
5851 1.1 dyoung static int
5852 1.1 dyoung ixgbe_sysctl_tdh_handler(SYSCTLFN_ARGS)
5853 1.1 dyoung {
5854 1.1 dyoung struct sysctlnode node;
5855 1.1 dyoung uint32_t val;
5856 1.1 dyoung struct tx_ring *txr;
5857 1.1 dyoung
5858 1.1 dyoung node = *rnode;
5859 1.1 dyoung txr = (struct tx_ring *)node.sysctl_data;
5860 1.1 dyoung if (txr == NULL)
5861 1.1 dyoung return 0;
5862 1.1 dyoung val = IXGBE_READ_REG(&txr->adapter->hw, IXGBE_TDH(txr->me));
5863 1.1 dyoung node.sysctl_data = &val;
5864 1.1 dyoung return sysctl_lookup(SYSCTLFN_CALL(&node));
5865 1.1 dyoung }
5866 1.1 dyoung
5867 1.1 dyoung /** ixgbe_sysctl_tdt_handler - Handler function
5868 1.1 dyoung * Retrieves the TDT value from the hardware
5869 1.1 dyoung */
5870 1.1 dyoung static int
5871 1.1 dyoung ixgbe_sysctl_tdt_handler(SYSCTLFN_ARGS)
5872 1.1 dyoung {
5873 1.1 dyoung struct sysctlnode node;
5874 1.1 dyoung uint32_t val;
5875 1.1 dyoung struct tx_ring *txr;
5876 1.1 dyoung
5877 1.1 dyoung node = *rnode;
5878 1.1 dyoung txr = (struct tx_ring *)node.sysctl_data;
5879 1.1 dyoung if (txr == NULL)
5880 1.1 dyoung return 0;
5881 1.1 dyoung val = IXGBE_READ_REG(&txr->adapter->hw, IXGBE_TDT(txr->me));
5882 1.1 dyoung node.sysctl_data = &val;
5883 1.1 dyoung return sysctl_lookup(SYSCTLFN_CALL(&node));
5884 1.1 dyoung }
5885 1.1 dyoung
5886 1.1 dyoung /** ixgbe_sysctl_rdh_handler - Handler function
5887 1.1 dyoung * Retrieves the RDH value from the hardware
5888 1.1 dyoung */
5889 1.1 dyoung static int
5890 1.1 dyoung ixgbe_sysctl_rdh_handler(SYSCTLFN_ARGS)
5891 1.1 dyoung {
5892 1.1 dyoung struct sysctlnode node;
5893 1.1 dyoung uint32_t val;
5894 1.1 dyoung struct rx_ring *rxr;
5895 1.1 dyoung
5896 1.1 dyoung node = *rnode;
5897 1.1 dyoung rxr = (struct rx_ring *)node.sysctl_data;
5898 1.1 dyoung if (rxr == NULL)
5899 1.1 dyoung return 0;
5900 1.1 dyoung val = IXGBE_READ_REG(&rxr->adapter->hw, IXGBE_RDH(rxr->me));
5901 1.1 dyoung node.sysctl_data = &val;
5902 1.1 dyoung return sysctl_lookup(SYSCTLFN_CALL(&node));
5903 1.1 dyoung }
5904 1.1 dyoung
5905 1.1 dyoung /** ixgbe_sysctl_rdt_handler - Handler function
5906 1.1 dyoung * Retrieves the RDT value from the hardware
5907 1.1 dyoung */
5908 1.1 dyoung static int
5909 1.1 dyoung ixgbe_sysctl_rdt_handler(SYSCTLFN_ARGS)
5910 1.1 dyoung {
5911 1.1 dyoung struct sysctlnode node;
5912 1.1 dyoung uint32_t val;
5913 1.1 dyoung struct rx_ring *rxr;
5914 1.1 dyoung
5915 1.1 dyoung node = *rnode;
5916 1.1 dyoung rxr = (struct rx_ring *)node.sysctl_data;
5917 1.1 dyoung if (rxr == NULL)
5918 1.1 dyoung return 0;
5919 1.1 dyoung val = IXGBE_READ_REG(&rxr->adapter->hw, IXGBE_RDT(rxr->me));
5920 1.1 dyoung node.sysctl_data = &val;
5921 1.1 dyoung return sysctl_lookup(SYSCTLFN_CALL(&node));
5922 1.1 dyoung }
5923 1.1 dyoung
5924 1.1 dyoung static int
5925 1.1 dyoung ixgbe_sysctl_interrupt_rate_handler(SYSCTLFN_ARGS)
5926 1.1 dyoung {
5927 1.14.2.3 martin int error;
5928 1.1 dyoung struct sysctlnode node;
5929 1.1 dyoung struct ix_queue *que;
5930 1.1 dyoung uint32_t reg, usec, rate;
5931 1.1 dyoung
5932 1.1 dyoung node = *rnode;
5933 1.1 dyoung que = (struct ix_queue *)node.sysctl_data;
5934 1.1 dyoung if (que == NULL)
5935 1.1 dyoung return 0;
5936 1.1 dyoung reg = IXGBE_READ_REG(&que->adapter->hw, IXGBE_EITR(que->msix));
5937 1.1 dyoung usec = ((reg & 0x0FF8) >> 3);
5938 1.1 dyoung if (usec > 0)
5939 1.14.2.3 martin rate = 500000 / usec;
5940 1.1 dyoung else
5941 1.1 dyoung rate = 0;
5942 1.1 dyoung node.sysctl_data = &rate;
5943 1.14.2.3 martin error = sysctl_lookup(SYSCTLFN_CALL(&node));
5944 1.14.2.3 martin if (error)
5945 1.14.2.3 martin return error;
5946 1.14.2.3 martin reg &= ~0xfff; /* default, no limitation */
5947 1.14.2.3 martin ixgbe_max_interrupt_rate = 0;
5948 1.14.2.3 martin if (rate > 0 && rate < 500000) {
5949 1.14.2.3 martin if (rate < 1000)
5950 1.14.2.3 martin rate = 1000;
5951 1.14.2.3 martin ixgbe_max_interrupt_rate = rate;
5952 1.14.2.3 martin reg |= ((4000000/rate) & 0xff8 );
5953 1.14.2.3 martin }
5954 1.14.2.3 martin IXGBE_WRITE_REG(&que->adapter->hw, IXGBE_EITR(que->msix), reg);
5955 1.14.2.3 martin return 0;
5956 1.1 dyoung }
5957 1.1 dyoung
5958 1.1 dyoung const struct sysctlnode *
5959 1.1 dyoung ixgbe_sysctl_instance(struct adapter *adapter)
5960 1.1 dyoung {
5961 1.1 dyoung const char *dvname;
5962 1.1 dyoung struct sysctllog **log;
5963 1.1 dyoung int rc;
5964 1.1 dyoung const struct sysctlnode *rnode;
5965 1.1 dyoung
5966 1.1 dyoung log = &adapter->sysctllog;
5967 1.1 dyoung dvname = device_xname(adapter->dev);
5968 1.1 dyoung
5969 1.1 dyoung if ((rc = sysctl_createv(log, 0, NULL, &rnode,
5970 1.1 dyoung 0, CTLTYPE_NODE, dvname,
5971 1.1 dyoung SYSCTL_DESCR("ixgbe information and settings"),
5972 1.7 pooka NULL, 0, NULL, 0, CTL_HW, CTL_CREATE, CTL_EOL)) != 0)
5973 1.1 dyoung goto err;
5974 1.1 dyoung
5975 1.1 dyoung return rnode;
5976 1.1 dyoung err:
5977 1.1 dyoung printf("%s: sysctl_createv failed, rc = %d\n", __func__, rc);
5978 1.1 dyoung return NULL;
5979 1.1 dyoung }
5980 1.1 dyoung
5981 1.1 dyoung /*
5982 1.1 dyoung * Add sysctl variables, one per statistic, to the system.
5983 1.1 dyoung */
5984 1.1 dyoung static void
5985 1.1 dyoung ixgbe_add_hw_stats(struct adapter *adapter)
5986 1.1 dyoung {
5987 1.1 dyoung device_t dev = adapter->dev;
5988 1.1 dyoung const struct sysctlnode *rnode, *cnode;
5989 1.1 dyoung struct sysctllog **log = &adapter->sysctllog;
5990 1.1 dyoung struct tx_ring *txr = adapter->tx_rings;
5991 1.1 dyoung struct rx_ring *rxr = adapter->rx_rings;
5992 1.1 dyoung struct ixgbe_hw_stats *stats = &adapter->stats;
5993 1.1 dyoung
5994 1.1 dyoung /* Driver Statistics */
5995 1.1 dyoung #if 0
5996 1.1 dyoung /* These counters are not updated by the software */
5997 1.1 dyoung SYSCTL_ADD_ULONG(ctx, child, OID_AUTO, "dropped",
5998 1.1 dyoung CTLFLAG_RD, &adapter->dropped_pkts,
5999 1.1 dyoung "Driver dropped packets");
6000 1.1 dyoung SYSCTL_ADD_ULONG(ctx, child, OID_AUTO, "mbuf_header_failed",
6001 1.1 dyoung CTLFLAG_RD, &adapter->mbuf_header_failed,
6002 1.1 dyoung "???");
6003 1.1 dyoung SYSCTL_ADD_ULONG(ctx, child, OID_AUTO, "mbuf_packet_failed",
6004 1.1 dyoung CTLFLAG_RD, &adapter->mbuf_packet_failed,
6005 1.1 dyoung "???");
6006 1.1 dyoung SYSCTL_ADD_ULONG(ctx, child, OID_AUTO, "no_tx_map_avail",
6007 1.1 dyoung CTLFLAG_RD, &adapter->no_tx_map_avail,
6008 1.1 dyoung "???");
6009 1.1 dyoung #endif
6010 1.1 dyoung evcnt_attach_dynamic(&adapter->handleq, EVCNT_TYPE_MISC,
6011 1.1 dyoung NULL, device_xname(dev), "Handled queue in softint");
6012 1.1 dyoung evcnt_attach_dynamic(&adapter->req, EVCNT_TYPE_MISC,
6013 1.1 dyoung NULL, device_xname(dev), "Requeued in softint");
6014 1.1 dyoung evcnt_attach_dynamic(&adapter->morerx, EVCNT_TYPE_MISC,
6015 1.1 dyoung NULL, device_xname(dev), "Interrupt handler more rx");
6016 1.1 dyoung evcnt_attach_dynamic(&adapter->moretx, EVCNT_TYPE_MISC,
6017 1.1 dyoung NULL, device_xname(dev), "Interrupt handler more tx");
6018 1.1 dyoung evcnt_attach_dynamic(&adapter->txloops, EVCNT_TYPE_MISC,
6019 1.1 dyoung NULL, device_xname(dev), "Interrupt handler tx loops");
6020 1.1 dyoung evcnt_attach_dynamic(&adapter->efbig_tx_dma_setup, EVCNT_TYPE_MISC,
6021 1.1 dyoung NULL, device_xname(dev), "Driver tx dma soft fail EFBIG");
6022 1.1 dyoung evcnt_attach_dynamic(&adapter->m_defrag_failed, EVCNT_TYPE_MISC,
6023 1.1 dyoung NULL, device_xname(dev), "m_defrag() failed");
6024 1.1 dyoung evcnt_attach_dynamic(&adapter->efbig2_tx_dma_setup, EVCNT_TYPE_MISC,
6025 1.1 dyoung NULL, device_xname(dev), "Driver tx dma hard fail EFBIG");
6026 1.1 dyoung evcnt_attach_dynamic(&adapter->einval_tx_dma_setup, EVCNT_TYPE_MISC,
6027 1.1 dyoung NULL, device_xname(dev), "Driver tx dma hard fail EINVAL");
6028 1.1 dyoung evcnt_attach_dynamic(&adapter->other_tx_dma_setup, EVCNT_TYPE_MISC,
6029 1.1 dyoung NULL, device_xname(dev), "Driver tx dma hard fail other");
6030 1.1 dyoung evcnt_attach_dynamic(&adapter->eagain_tx_dma_setup, EVCNT_TYPE_MISC,
6031 1.1 dyoung NULL, device_xname(dev), "Driver tx dma soft fail EAGAIN");
6032 1.1 dyoung evcnt_attach_dynamic(&adapter->enomem_tx_dma_setup, EVCNT_TYPE_MISC,
6033 1.1 dyoung NULL, device_xname(dev), "Driver tx dma soft fail ENOMEM");
6034 1.1 dyoung evcnt_attach_dynamic(&adapter->watchdog_events, EVCNT_TYPE_MISC,
6035 1.1 dyoung NULL, device_xname(dev), "Watchdog timeouts");
6036 1.1 dyoung evcnt_attach_dynamic(&adapter->tso_err, EVCNT_TYPE_MISC,
6037 1.1 dyoung NULL, device_xname(dev), "TSO errors");
6038 1.1 dyoung evcnt_attach_dynamic(&adapter->link_irq, EVCNT_TYPE_MISC,
6039 1.1 dyoung NULL, device_xname(dev), "Link MSIX IRQ Handled");
6040 1.1 dyoung
6041 1.1 dyoung for (int i = 0; i < adapter->num_queues; i++, rxr++, txr++) {
6042 1.1 dyoung snprintf(adapter->queues[i].evnamebuf,
6043 1.1 dyoung sizeof(adapter->queues[i].evnamebuf), "%s queue%d",
6044 1.1 dyoung device_xname(dev), i);
6045 1.1 dyoung snprintf(adapter->queues[i].namebuf,
6046 1.1 dyoung sizeof(adapter->queues[i].namebuf), "queue%d", i);
6047 1.1 dyoung
6048 1.1 dyoung if ((rnode = ixgbe_sysctl_instance(adapter)) == NULL) {
6049 1.1 dyoung aprint_error_dev(dev, "could not create sysctl root\n");
6050 1.1 dyoung break;
6051 1.1 dyoung }
6052 1.1 dyoung
6053 1.1 dyoung if (sysctl_createv(log, 0, &rnode, &rnode,
6054 1.1 dyoung 0, CTLTYPE_NODE,
6055 1.1 dyoung adapter->queues[i].namebuf, SYSCTL_DESCR("Queue Name"),
6056 1.1 dyoung NULL, 0, NULL, 0, CTL_CREATE, CTL_EOL) != 0)
6057 1.1 dyoung break;
6058 1.1 dyoung
6059 1.1 dyoung if (sysctl_createv(log, 0, &rnode, &cnode,
6060 1.14.2.3 martin CTLFLAG_READWRITE, CTLTYPE_INT,
6061 1.1 dyoung "interrupt_rate", SYSCTL_DESCR("Interrupt Rate"),
6062 1.5 dsl ixgbe_sysctl_interrupt_rate_handler, 0,
6063 1.5 dsl (void *)&adapter->queues[i], 0, CTL_CREATE, CTL_EOL) != 0)
6064 1.1 dyoung break;
6065 1.1 dyoung
6066 1.1 dyoung if (sysctl_createv(log, 0, &rnode, &cnode,
6067 1.14.2.3 martin CTLFLAG_READONLY, CTLTYPE_QUAD,
6068 1.14.2.3 martin "irqs", SYSCTL_DESCR("irqs on this queue"),
6069 1.14.2.3 martin NULL, 0, &(adapter->queues[i].irqs),
6070 1.14.2.3 martin 0, CTL_CREATE, CTL_EOL) != 0)
6071 1.14.2.3 martin break;
6072 1.14.2.3 martin
6073 1.14.2.3 martin if (sysctl_createv(log, 0, &rnode, &cnode,
6074 1.1 dyoung CTLFLAG_READONLY, CTLTYPE_INT,
6075 1.1 dyoung "txd_head", SYSCTL_DESCR("Transmit Descriptor Head"),
6076 1.4 dsl ixgbe_sysctl_tdh_handler, 0, (void *)txr,
6077 1.1 dyoung 0, CTL_CREATE, CTL_EOL) != 0)
6078 1.1 dyoung break;
6079 1.1 dyoung
6080 1.1 dyoung if (sysctl_createv(log, 0, &rnode, &cnode,
6081 1.1 dyoung CTLFLAG_READONLY, CTLTYPE_INT,
6082 1.1 dyoung "txd_tail", SYSCTL_DESCR("Transmit Descriptor Tail"),
6083 1.4 dsl ixgbe_sysctl_tdt_handler, 0, (void *)txr,
6084 1.1 dyoung 0, CTL_CREATE, CTL_EOL) != 0)
6085 1.1 dyoung break;
6086 1.1 dyoung
6087 1.14.2.5 riz evcnt_attach_dynamic(&txr->tso_tx, EVCNT_TYPE_MISC,
6088 1.14.2.5 riz NULL, device_xname(dev), "TSO");
6089 1.1 dyoung evcnt_attach_dynamic(&txr->no_desc_avail, EVCNT_TYPE_MISC,
6090 1.1 dyoung NULL, adapter->queues[i].evnamebuf,
6091 1.1 dyoung "Queue No Descriptor Available");
6092 1.1 dyoung evcnt_attach_dynamic(&txr->total_packets, EVCNT_TYPE_MISC,
6093 1.1 dyoung NULL, adapter->queues[i].evnamebuf,
6094 1.1 dyoung "Queue Packets Transmitted");
6095 1.1 dyoung
6096 1.1 dyoung #ifdef LRO
6097 1.1 dyoung struct lro_ctrl *lro = &rxr->lro;
6098 1.1 dyoung #endif /* LRO */
6099 1.1 dyoung
6100 1.1 dyoung if (sysctl_createv(log, 0, &rnode, &cnode,
6101 1.1 dyoung CTLFLAG_READONLY,
6102 1.1 dyoung CTLTYPE_INT,
6103 1.1 dyoung "rxd_head", SYSCTL_DESCR("Receive Descriptor Head"),
6104 1.4 dsl ixgbe_sysctl_rdh_handler, 0, (void *)rxr, 0,
6105 1.1 dyoung CTL_CREATE, CTL_EOL) != 0)
6106 1.1 dyoung break;
6107 1.1 dyoung
6108 1.1 dyoung if (sysctl_createv(log, 0, &rnode, &cnode,
6109 1.1 dyoung CTLFLAG_READONLY,
6110 1.1 dyoung CTLTYPE_INT,
6111 1.1 dyoung "rxd_tail", SYSCTL_DESCR("Receive Descriptor Tail"),
6112 1.4 dsl ixgbe_sysctl_rdt_handler, 0, (void *)rxr, 0,
6113 1.1 dyoung CTL_CREATE, CTL_EOL) != 0)
6114 1.1 dyoung break;
6115 1.1 dyoung
6116 1.1 dyoung if (i < __arraycount(adapter->stats.mpc)) {
6117 1.1 dyoung evcnt_attach_dynamic(&adapter->stats.mpc[i],
6118 1.1 dyoung EVCNT_TYPE_MISC, NULL, adapter->queues[i].evnamebuf,
6119 1.1 dyoung "Missed Packet Count");
6120 1.1 dyoung }
6121 1.1 dyoung if (i < __arraycount(adapter->stats.pxontxc)) {
6122 1.1 dyoung evcnt_attach_dynamic(&adapter->stats.pxontxc[i],
6123 1.1 dyoung EVCNT_TYPE_MISC, NULL, adapter->queues[i].evnamebuf,
6124 1.1 dyoung "pxontxc");
6125 1.1 dyoung evcnt_attach_dynamic(&adapter->stats.pxonrxc[i],
6126 1.1 dyoung EVCNT_TYPE_MISC, NULL, adapter->queues[i].evnamebuf,
6127 1.1 dyoung "pxonrxc");
6128 1.1 dyoung evcnt_attach_dynamic(&adapter->stats.pxofftxc[i],
6129 1.1 dyoung EVCNT_TYPE_MISC, NULL, adapter->queues[i].evnamebuf,
6130 1.1 dyoung "pxofftxc");
6131 1.1 dyoung evcnt_attach_dynamic(&adapter->stats.pxoffrxc[i],
6132 1.1 dyoung EVCNT_TYPE_MISC, NULL, adapter->queues[i].evnamebuf,
6133 1.1 dyoung "pxoffrxc");
6134 1.1 dyoung evcnt_attach_dynamic(&adapter->stats.pxon2offc[i],
6135 1.1 dyoung EVCNT_TYPE_MISC, NULL, adapter->queues[i].evnamebuf,
6136 1.1 dyoung "pxon2offc");
6137 1.1 dyoung }
6138 1.1 dyoung if (i < __arraycount(adapter->stats.qprc)) {
6139 1.1 dyoung evcnt_attach_dynamic(&adapter->stats.qprc[i],
6140 1.1 dyoung EVCNT_TYPE_MISC, NULL, adapter->queues[i].evnamebuf,
6141 1.1 dyoung "qprc");
6142 1.1 dyoung evcnt_attach_dynamic(&adapter->stats.qptc[i],
6143 1.1 dyoung EVCNT_TYPE_MISC, NULL, adapter->queues[i].evnamebuf,
6144 1.1 dyoung "qptc");
6145 1.1 dyoung evcnt_attach_dynamic(&adapter->stats.qbrc[i],
6146 1.1 dyoung EVCNT_TYPE_MISC, NULL, adapter->queues[i].evnamebuf,
6147 1.1 dyoung "qbrc");
6148 1.1 dyoung evcnt_attach_dynamic(&adapter->stats.qbtc[i],
6149 1.1 dyoung EVCNT_TYPE_MISC, NULL, adapter->queues[i].evnamebuf,
6150 1.1 dyoung "qbtc");
6151 1.1 dyoung evcnt_attach_dynamic(&adapter->stats.qprdc[i],
6152 1.1 dyoung EVCNT_TYPE_MISC, NULL, adapter->queues[i].evnamebuf,
6153 1.1 dyoung "qprdc");
6154 1.1 dyoung }
6155 1.1 dyoung
6156 1.1 dyoung evcnt_attach_dynamic(&rxr->rx_packets, EVCNT_TYPE_MISC,
6157 1.1 dyoung NULL, adapter->queues[i].evnamebuf, "Queue Packets Received");
6158 1.1 dyoung evcnt_attach_dynamic(&rxr->rx_bytes, EVCNT_TYPE_MISC,
6159 1.1 dyoung NULL, adapter->queues[i].evnamebuf, "Queue Bytes Received");
6160 1.14.2.4 riz evcnt_attach_dynamic(&rxr->rx_copies, EVCNT_TYPE_MISC,
6161 1.14.2.4 riz NULL, adapter->queues[i].evnamebuf, "Copied RX Frames");
6162 1.1 dyoung evcnt_attach_dynamic(&rxr->no_jmbuf, EVCNT_TYPE_MISC,
6163 1.1 dyoung NULL, adapter->queues[i].evnamebuf, "Rx no jumbo mbuf");
6164 1.1 dyoung evcnt_attach_dynamic(&rxr->rx_discarded, EVCNT_TYPE_MISC,
6165 1.1 dyoung NULL, adapter->queues[i].evnamebuf, "Rx discarded");
6166 1.1 dyoung evcnt_attach_dynamic(&rxr->rx_irq, EVCNT_TYPE_MISC,
6167 1.1 dyoung NULL, adapter->queues[i].evnamebuf, "Rx interrupts");
6168 1.1 dyoung #ifdef LRO
6169 1.1 dyoung SYSCTL_ADD_INT(ctx, queue_list, OID_AUTO, "lro_queued",
6170 1.1 dyoung CTLFLAG_RD, &lro->lro_queued, 0,
6171 1.1 dyoung "LRO Queued");
6172 1.1 dyoung SYSCTL_ADD_INT(ctx, queue_list, OID_AUTO, "lro_flushed",
6173 1.1 dyoung CTLFLAG_RD, &lro->lro_flushed, 0,
6174 1.1 dyoung "LRO Flushed");
6175 1.1 dyoung #endif /* LRO */
6176 1.1 dyoung }
6177 1.1 dyoung
6178 1.1 dyoung /* MAC stats get the own sub node */
6179 1.1 dyoung
6180 1.1 dyoung
6181 1.1 dyoung snprintf(stats->namebuf,
6182 1.1 dyoung sizeof(stats->namebuf), "%s MAC Statistics", device_xname(dev));
6183 1.1 dyoung
6184 1.1 dyoung evcnt_attach_dynamic(&stats->ipcs, EVCNT_TYPE_MISC, NULL,
6185 1.1 dyoung stats->namebuf, "rx csum offload - IP");
6186 1.1 dyoung evcnt_attach_dynamic(&stats->l4cs, EVCNT_TYPE_MISC, NULL,
6187 1.1 dyoung stats->namebuf, "rx csum offload - L4");
6188 1.1 dyoung evcnt_attach_dynamic(&stats->ipcs_bad, EVCNT_TYPE_MISC, NULL,
6189 1.1 dyoung stats->namebuf, "rx csum offload - IP bad");
6190 1.1 dyoung evcnt_attach_dynamic(&stats->l4cs_bad, EVCNT_TYPE_MISC, NULL,
6191 1.1 dyoung stats->namebuf, "rx csum offload - L4 bad");
6192 1.1 dyoung evcnt_attach_dynamic(&stats->intzero, EVCNT_TYPE_MISC, NULL,
6193 1.1 dyoung stats->namebuf, "Interrupt conditions zero");
6194 1.1 dyoung evcnt_attach_dynamic(&stats->legint, EVCNT_TYPE_MISC, NULL,
6195 1.1 dyoung stats->namebuf, "Legacy interrupts");
6196 1.1 dyoung evcnt_attach_dynamic(&stats->crcerrs, EVCNT_TYPE_MISC, NULL,
6197 1.1 dyoung stats->namebuf, "CRC Errors");
6198 1.1 dyoung evcnt_attach_dynamic(&stats->illerrc, EVCNT_TYPE_MISC, NULL,
6199 1.1 dyoung stats->namebuf, "Illegal Byte Errors");
6200 1.1 dyoung evcnt_attach_dynamic(&stats->errbc, EVCNT_TYPE_MISC, NULL,
6201 1.1 dyoung stats->namebuf, "Byte Errors");
6202 1.1 dyoung evcnt_attach_dynamic(&stats->mspdc, EVCNT_TYPE_MISC, NULL,
6203 1.1 dyoung stats->namebuf, "MAC Short Packets Discarded");
6204 1.1 dyoung evcnt_attach_dynamic(&stats->mlfc, EVCNT_TYPE_MISC, NULL,
6205 1.1 dyoung stats->namebuf, "MAC Local Faults");
6206 1.1 dyoung evcnt_attach_dynamic(&stats->mrfc, EVCNT_TYPE_MISC, NULL,
6207 1.1 dyoung stats->namebuf, "MAC Remote Faults");
6208 1.1 dyoung evcnt_attach_dynamic(&stats->rlec, EVCNT_TYPE_MISC, NULL,
6209 1.1 dyoung stats->namebuf, "Receive Length Errors");
6210 1.1 dyoung evcnt_attach_dynamic(&stats->lxontxc, EVCNT_TYPE_MISC, NULL,
6211 1.1 dyoung stats->namebuf, "Link XON Transmitted");
6212 1.1 dyoung evcnt_attach_dynamic(&stats->lxonrxc, EVCNT_TYPE_MISC, NULL,
6213 1.1 dyoung stats->namebuf, "Link XON Received");
6214 1.1 dyoung evcnt_attach_dynamic(&stats->lxofftxc, EVCNT_TYPE_MISC, NULL,
6215 1.1 dyoung stats->namebuf, "Link XOFF Transmitted");
6216 1.1 dyoung evcnt_attach_dynamic(&stats->lxoffrxc, EVCNT_TYPE_MISC, NULL,
6217 1.1 dyoung stats->namebuf, "Link XOFF Received");
6218 1.1 dyoung
6219 1.1 dyoung /* Packet Reception Stats */
6220 1.1 dyoung evcnt_attach_dynamic(&stats->tor, EVCNT_TYPE_MISC, NULL,
6221 1.1 dyoung stats->namebuf, "Total Octets Received");
6222 1.1 dyoung evcnt_attach_dynamic(&stats->gorc, EVCNT_TYPE_MISC, NULL,
6223 1.1 dyoung stats->namebuf, "Good Octets Received");
6224 1.1 dyoung evcnt_attach_dynamic(&stats->tpr, EVCNT_TYPE_MISC, NULL,
6225 1.1 dyoung stats->namebuf, "Total Packets Received");
6226 1.1 dyoung evcnt_attach_dynamic(&stats->gprc, EVCNT_TYPE_MISC, NULL,
6227 1.1 dyoung stats->namebuf, "Good Packets Received");
6228 1.1 dyoung evcnt_attach_dynamic(&stats->mprc, EVCNT_TYPE_MISC, NULL,
6229 1.1 dyoung stats->namebuf, "Multicast Packets Received");
6230 1.1 dyoung evcnt_attach_dynamic(&stats->bprc, EVCNT_TYPE_MISC, NULL,
6231 1.1 dyoung stats->namebuf, "Broadcast Packets Received");
6232 1.1 dyoung evcnt_attach_dynamic(&stats->prc64, EVCNT_TYPE_MISC, NULL,
6233 1.1 dyoung stats->namebuf, "64 byte frames received ");
6234 1.1 dyoung evcnt_attach_dynamic(&stats->prc127, EVCNT_TYPE_MISC, NULL,
6235 1.1 dyoung stats->namebuf, "65-127 byte frames received");
6236 1.1 dyoung evcnt_attach_dynamic(&stats->prc255, EVCNT_TYPE_MISC, NULL,
6237 1.1 dyoung stats->namebuf, "128-255 byte frames received");
6238 1.1 dyoung evcnt_attach_dynamic(&stats->prc511, EVCNT_TYPE_MISC, NULL,
6239 1.1 dyoung stats->namebuf, "256-511 byte frames received");
6240 1.1 dyoung evcnt_attach_dynamic(&stats->prc1023, EVCNT_TYPE_MISC, NULL,
6241 1.1 dyoung stats->namebuf, "512-1023 byte frames received");
6242 1.1 dyoung evcnt_attach_dynamic(&stats->prc1522, EVCNT_TYPE_MISC, NULL,
6243 1.1 dyoung stats->namebuf, "1023-1522 byte frames received");
6244 1.1 dyoung evcnt_attach_dynamic(&stats->ruc, EVCNT_TYPE_MISC, NULL,
6245 1.1 dyoung stats->namebuf, "Receive Undersized");
6246 1.1 dyoung evcnt_attach_dynamic(&stats->rfc, EVCNT_TYPE_MISC, NULL,
6247 1.1 dyoung stats->namebuf, "Fragmented Packets Received ");
6248 1.1 dyoung evcnt_attach_dynamic(&stats->roc, EVCNT_TYPE_MISC, NULL,
6249 1.1 dyoung stats->namebuf, "Oversized Packets Received");
6250 1.1 dyoung evcnt_attach_dynamic(&stats->rjc, EVCNT_TYPE_MISC, NULL,
6251 1.1 dyoung stats->namebuf, "Received Jabber");
6252 1.1 dyoung evcnt_attach_dynamic(&stats->mngprc, EVCNT_TYPE_MISC, NULL,
6253 1.1 dyoung stats->namebuf, "Management Packets Received");
6254 1.1 dyoung evcnt_attach_dynamic(&stats->xec, EVCNT_TYPE_MISC, NULL,
6255 1.1 dyoung stats->namebuf, "Checksum Errors");
6256 1.1 dyoung
6257 1.1 dyoung /* Packet Transmission Stats */
6258 1.1 dyoung evcnt_attach_dynamic(&stats->gotc, EVCNT_TYPE_MISC, NULL,
6259 1.1 dyoung stats->namebuf, "Good Octets Transmitted");
6260 1.1 dyoung evcnt_attach_dynamic(&stats->tpt, EVCNT_TYPE_MISC, NULL,
6261 1.1 dyoung stats->namebuf, "Total Packets Transmitted");
6262 1.1 dyoung evcnt_attach_dynamic(&stats->gptc, EVCNT_TYPE_MISC, NULL,
6263 1.1 dyoung stats->namebuf, "Good Packets Transmitted");
6264 1.1 dyoung evcnt_attach_dynamic(&stats->bptc, EVCNT_TYPE_MISC, NULL,
6265 1.1 dyoung stats->namebuf, "Broadcast Packets Transmitted");
6266 1.1 dyoung evcnt_attach_dynamic(&stats->mptc, EVCNT_TYPE_MISC, NULL,
6267 1.1 dyoung stats->namebuf, "Multicast Packets Transmitted");
6268 1.1 dyoung evcnt_attach_dynamic(&stats->mngptc, EVCNT_TYPE_MISC, NULL,
6269 1.1 dyoung stats->namebuf, "Management Packets Transmitted");
6270 1.1 dyoung evcnt_attach_dynamic(&stats->ptc64, EVCNT_TYPE_MISC, NULL,
6271 1.1 dyoung stats->namebuf, "64 byte frames transmitted ");
6272 1.1 dyoung evcnt_attach_dynamic(&stats->ptc127, EVCNT_TYPE_MISC, NULL,
6273 1.1 dyoung stats->namebuf, "65-127 byte frames transmitted");
6274 1.1 dyoung evcnt_attach_dynamic(&stats->ptc255, EVCNT_TYPE_MISC, NULL,
6275 1.1 dyoung stats->namebuf, "128-255 byte frames transmitted");
6276 1.1 dyoung evcnt_attach_dynamic(&stats->ptc511, EVCNT_TYPE_MISC, NULL,
6277 1.1 dyoung stats->namebuf, "256-511 byte frames transmitted");
6278 1.1 dyoung evcnt_attach_dynamic(&stats->ptc1023, EVCNT_TYPE_MISC, NULL,
6279 1.1 dyoung stats->namebuf, "512-1023 byte frames transmitted");
6280 1.1 dyoung evcnt_attach_dynamic(&stats->ptc1522, EVCNT_TYPE_MISC, NULL,
6281 1.1 dyoung stats->namebuf, "1024-1522 byte frames transmitted");
6282 1.1 dyoung }
6283 1.1 dyoung
6284 1.1 dyoung /*
6285 1.1 dyoung ** Set flow control using sysctl:
6286 1.1 dyoung ** Flow control values:
6287 1.1 dyoung ** 0 - off
6288 1.1 dyoung ** 1 - rx pause
6289 1.1 dyoung ** 2 - tx pause
6290 1.1 dyoung ** 3 - full
6291 1.1 dyoung */
6292 1.1 dyoung static int
6293 1.1 dyoung ixgbe_set_flowcntl(SYSCTLFN_ARGS)
6294 1.1 dyoung {
6295 1.1 dyoung struct sysctlnode node;
6296 1.14.2.4 riz int error, last;
6297 1.1 dyoung struct adapter *adapter;
6298 1.1 dyoung
6299 1.1 dyoung node = *rnode;
6300 1.1 dyoung adapter = (struct adapter *)node.sysctl_data;
6301 1.14.2.4 riz node.sysctl_data = &adapter->fc;
6302 1.14.2.4 riz last = adapter->fc;
6303 1.1 dyoung error = sysctl_lookup(SYSCTLFN_CALL(&node));
6304 1.1 dyoung if (error != 0 || newp == NULL)
6305 1.1 dyoung return error;
6306 1.1 dyoung
6307 1.1 dyoung /* Don't bother if it's not changed */
6308 1.14.2.4 riz if (adapter->fc == last)
6309 1.1 dyoung return (0);
6310 1.1 dyoung
6311 1.14.2.4 riz switch (adapter->fc) {
6312 1.1 dyoung case ixgbe_fc_rx_pause:
6313 1.1 dyoung case ixgbe_fc_tx_pause:
6314 1.1 dyoung case ixgbe_fc_full:
6315 1.14.2.4 riz adapter->hw.fc.requested_mode = adapter->fc;
6316 1.14.2.4 riz if (adapter->num_queues > 1)
6317 1.14.2.4 riz ixgbe_disable_rx_drop(adapter);
6318 1.1 dyoung break;
6319 1.1 dyoung case ixgbe_fc_none:
6320 1.1 dyoung adapter->hw.fc.requested_mode = ixgbe_fc_none;
6321 1.14.2.4 riz if (adapter->num_queues > 1)
6322 1.14.2.4 riz ixgbe_enable_rx_drop(adapter);
6323 1.14.2.5 riz break;
6324 1.14.2.5 riz default:
6325 1.14.2.5 riz adapter->fc = last;
6326 1.14.2.5 riz return (EINVAL);
6327 1.1 dyoung }
6328 1.14.2.4 riz /* Don't autoneg if forcing a value */
6329 1.14.2.4 riz adapter->hw.fc.disable_fc_autoneg = TRUE;
6330 1.14.2.4 riz ixgbe_fc_enable(&adapter->hw);
6331 1.1 dyoung return 0;
6332 1.1 dyoung }
6333 1.1 dyoung
6334 1.14.2.6 snj
6335 1.1 dyoung /*
6336 1.1 dyoung ** Control link advertise speed:
6337 1.1 dyoung ** 1 - advertise only 1G
6338 1.14.2.4 riz ** 2 - advertise 100Mb
6339 1.14.2.4 riz ** 3 - advertise normal
6340 1.1 dyoung */
6341 1.1 dyoung static int
6342 1.1 dyoung ixgbe_set_advertise(SYSCTLFN_ARGS)
6343 1.1 dyoung {
6344 1.1 dyoung struct sysctlnode node;
6345 1.14.2.3 martin int t, error = 0;
6346 1.1 dyoung struct adapter *adapter;
6347 1.14.2.4 riz device_t dev;
6348 1.1 dyoung struct ixgbe_hw *hw;
6349 1.1 dyoung ixgbe_link_speed speed, last;
6350 1.1 dyoung
6351 1.1 dyoung node = *rnode;
6352 1.1 dyoung adapter = (struct adapter *)node.sysctl_data;
6353 1.14.2.4 riz dev = adapter->dev;
6354 1.14.2.4 riz hw = &adapter->hw;
6355 1.14.2.4 riz last = adapter->advertise;
6356 1.1 dyoung t = adapter->advertise;
6357 1.1 dyoung node.sysctl_data = &t;
6358 1.1 dyoung error = sysctl_lookup(SYSCTLFN_CALL(&node));
6359 1.1 dyoung if (error != 0 || newp == NULL)
6360 1.1 dyoung return error;
6361 1.1 dyoung
6362 1.14.2.4 riz if (adapter->advertise == last) /* no change */
6363 1.14.2.4 riz return (0);
6364 1.14.2.4 riz
6365 1.1 dyoung if (t == -1)
6366 1.1 dyoung return 0;
6367 1.1 dyoung
6368 1.1 dyoung adapter->advertise = t;
6369 1.1 dyoung
6370 1.1 dyoung if (!((hw->phy.media_type == ixgbe_media_type_copper) ||
6371 1.1 dyoung (hw->phy.multispeed_fiber)))
6372 1.14.2.5 riz return (EINVAL);
6373 1.1 dyoung
6374 1.14.2.4 riz if ((adapter->advertise == 2) && (hw->mac.type != ixgbe_mac_X540)) {
6375 1.14.2.4 riz device_printf(dev, "Set Advertise: 100Mb on X540 only\n");
6376 1.14.2.5 riz return (EINVAL);
6377 1.14.2.4 riz }
6378 1.14.2.4 riz
6379 1.1 dyoung if (adapter->advertise == 1)
6380 1.1 dyoung speed = IXGBE_LINK_SPEED_1GB_FULL;
6381 1.14.2.4 riz else if (adapter->advertise == 2)
6382 1.14.2.4 riz speed = IXGBE_LINK_SPEED_100_FULL;
6383 1.14.2.4 riz else if (adapter->advertise == 3)
6384 1.1 dyoung speed = IXGBE_LINK_SPEED_1GB_FULL |
6385 1.1 dyoung IXGBE_LINK_SPEED_10GB_FULL;
6386 1.14.2.6 snj else { /* bogus value */
6387 1.14.2.5 riz adapter->advertise = last;
6388 1.14.2.5 riz return (EINVAL);
6389 1.14.2.5 riz }
6390 1.1 dyoung
6391 1.1 dyoung hw->mac.autotry_restart = TRUE;
6392 1.14.2.5 riz hw->mac.ops.setup_link(hw, speed, TRUE);
6393 1.1 dyoung
6394 1.1 dyoung return 0;
6395 1.1 dyoung }
6396 1.14.2.4 riz
6397 1.14.2.4 riz /*
6398 1.14.2.4 riz ** Thermal Shutdown Trigger
6399 1.14.2.4 riz ** - cause a Thermal Overtemp IRQ
6400 1.14.2.6 snj ** - this now requires firmware enabling
6401 1.14.2.4 riz */
6402 1.14.2.4 riz static int
6403 1.14.2.4 riz ixgbe_set_thermal_test(SYSCTLFN_ARGS)
6404 1.14.2.4 riz {
6405 1.14.2.4 riz struct sysctlnode node;
6406 1.14.2.4 riz int error, fire = 0;
6407 1.14.2.4 riz struct adapter *adapter;
6408 1.14.2.4 riz struct ixgbe_hw *hw;
6409 1.14.2.4 riz
6410 1.14.2.4 riz node = *rnode;
6411 1.14.2.4 riz adapter = (struct adapter *)node.sysctl_data;
6412 1.14.2.4 riz hw = &adapter->hw;
6413 1.14.2.4 riz
6414 1.14.2.4 riz if (hw->mac.type != ixgbe_mac_X540)
6415 1.14.2.4 riz return (0);
6416 1.14.2.4 riz
6417 1.14.2.4 riz node.sysctl_data = &fire;
6418 1.14.2.4 riz error = sysctl_lookup(SYSCTLFN_CALL(&node));
6419 1.14.2.4 riz if ((error) || (newp == NULL))
6420 1.14.2.4 riz return (error);
6421 1.14.2.4 riz
6422 1.14.2.4 riz if (fire) {
6423 1.14.2.4 riz u32 reg = IXGBE_READ_REG(hw, IXGBE_EICS);
6424 1.14.2.4 riz reg |= IXGBE_EICR_TS;
6425 1.14.2.4 riz IXGBE_WRITE_REG(hw, IXGBE_EICS, reg);
6426 1.14.2.4 riz }
6427 1.14.2.4 riz
6428 1.14.2.4 riz return (0);
6429 1.14.2.4 riz }
6430 1.14.2.4 riz
6431 1.14.2.4 riz /*
6432 1.14.2.4 riz ** Enable the hardware to drop packets when the buffer is
6433 1.14.2.4 riz ** full. This is useful when multiqueue,so that no single
6434 1.14.2.4 riz ** queue being full stalls the entire RX engine. We only
6435 1.14.2.4 riz ** enable this when Multiqueue AND when Flow Control is
6436 1.14.2.4 riz ** disabled.
6437 1.14.2.4 riz */
6438 1.14.2.4 riz static void
6439 1.14.2.4 riz ixgbe_enable_rx_drop(struct adapter *adapter)
6440 1.14.2.4 riz {
6441 1.14.2.4 riz struct ixgbe_hw *hw = &adapter->hw;
6442 1.14.2.4 riz
6443 1.14.2.4 riz for (int i = 0; i < adapter->num_queues; i++) {
6444 1.14.2.4 riz u32 srrctl = IXGBE_READ_REG(hw, IXGBE_SRRCTL(i));
6445 1.14.2.4 riz srrctl |= IXGBE_SRRCTL_DROP_EN;
6446 1.14.2.4 riz IXGBE_WRITE_REG(hw, IXGBE_SRRCTL(i), srrctl);
6447 1.14.2.4 riz }
6448 1.14.2.4 riz }
6449 1.14.2.4 riz
6450 1.14.2.4 riz static void
6451 1.14.2.4 riz ixgbe_disable_rx_drop(struct adapter *adapter)
6452 1.14.2.4 riz {
6453 1.14.2.4 riz struct ixgbe_hw *hw = &adapter->hw;
6454 1.14.2.4 riz
6455 1.14.2.4 riz for (int i = 0; i < adapter->num_queues; i++) {
6456 1.14.2.4 riz u32 srrctl = IXGBE_READ_REG(hw, IXGBE_SRRCTL(i));
6457 1.14.2.4 riz srrctl &= ~IXGBE_SRRCTL_DROP_EN;
6458 1.14.2.4 riz IXGBE_WRITE_REG(hw, IXGBE_SRRCTL(i), srrctl);
6459 1.14.2.4 riz }
6460 1.14.2.4 riz }
6461