ether_sw_offload.c revision 1.5 1 1.5 rin /* $NetBSD: ether_sw_offload.c,v 1.5 2018/12/15 07:29:44 rin Exp $ */
2 1.1 rin
3 1.1 rin /*
4 1.1 rin * Copyright (c) 2018 The NetBSD Foundation, Inc.
5 1.1 rin * All rights reserved.
6 1.1 rin *
7 1.1 rin * This code is derived from software contributed to The NetBSD Foundation
8 1.1 rin * by Rin Okuyama.
9 1.1 rin *
10 1.1 rin * Redistribution and use in source and binary forms, with or without
11 1.1 rin * modification, are permitted provided that the following conditions
12 1.1 rin * are met:
13 1.1 rin * 1. Redistributions of source code must retain the above copyright
14 1.1 rin * notice, this list of conditions and the following disclaimer.
15 1.1 rin * 2. Redistributions in binary form must reproduce the above copyright
16 1.1 rin * notice, this list of conditions and the following disclaimer in the
17 1.1 rin * documentation and/or other materials provided with the distribution.
18 1.1 rin *
19 1.1 rin * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
20 1.1 rin * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
21 1.1 rin * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 1.1 rin * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
23 1.1 rin * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24 1.1 rin * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25 1.1 rin * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26 1.1 rin * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27 1.1 rin * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28 1.1 rin * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29 1.1 rin * POSSIBILITY OF SUCH DAMAGE.
30 1.1 rin */
31 1.1 rin
32 1.2 rin #ifdef _KERNEL_OPT
33 1.2 rin #include "opt_inet.h"
34 1.2 rin #endif
35 1.2 rin
36 1.1 rin #include <sys/cdefs.h>
37 1.5 rin __KERNEL_RCSID(0, "$NetBSD: ether_sw_offload.c,v 1.5 2018/12/15 07:29:44 rin Exp $");
38 1.1 rin
39 1.1 rin #include <sys/param.h>
40 1.1 rin #include <sys/types.h>
41 1.1 rin #include <sys/mbuf.h>
42 1.5 rin #include <sys/syslog.h>
43 1.5 rin #include <sys/time.h>
44 1.1 rin
45 1.1 rin #include <net/if.h>
46 1.1 rin #include <net/if_ether.h>
47 1.1 rin #include <net/ether_sw_offload.h>
48 1.1 rin
49 1.1 rin #include <netinet/in.h>
50 1.1 rin #include <netinet/in_offload.h>
51 1.1 rin #include <netinet/ip.h>
52 1.1 rin #include <netinet/tcp.h>
53 1.1 rin #include <netinet/udp.h>
54 1.1 rin
55 1.2 rin #ifdef INET6
56 1.2 rin #include <netinet/ip6.h>
57 1.1 rin #include <netinet6/in6.h>
58 1.1 rin #include <netinet6/in6_offload.h>
59 1.2 rin #endif
60 1.1 rin
/*
 * Rate limiting for error messages: emit at most one message per
 * 10 seconds.  eso_err_lasttime is the state handed to ratecheck()
 * together with the interval below.
 */
static struct timeval eso_err_lasttime;
static const struct timeval eso_err_interval = { .tv_sec = 10, .tv_usec = 0 };
69 1.5 rin
70 1.5 rin /*
71 1.1 rin * Handle TX offload in software. For TSO, split the packet into
72 1.1 rin * chanks with payloads of size MSS. For chekcsum offload, update
73 1.1 rin * required checksum fields. The results are more than one packet
74 1.1 rin * in general. Return a mbuf chain consists of them.
75 1.1 rin */
76 1.1 rin
77 1.1 rin struct mbuf *
78 1.1 rin ether_sw_offload_tx(struct ifnet *ifp, struct mbuf *m)
79 1.1 rin {
80 1.1 rin struct ether_header *ep;
81 1.1 rin int flags, ehlen;
82 1.5 rin uint16_t type;
83 1.3 rin #ifdef INET6
84 1.2 rin bool v6;
85 1.3 rin #else
86 1.3 rin bool v6 __diagused;
87 1.3 rin #endif
88 1.1 rin
89 1.1 rin KASSERT(m->m_flags & M_PKTHDR);
90 1.1 rin flags = m->m_pkthdr.csum_flags;
91 1.1 rin if (flags == 0)
92 1.1 rin goto done;
93 1.1 rin
94 1.1 rin /* Sanity check */
95 1.1 rin if (!TX_OFFLOAD_SUPPORTED(ifp->if_csum_flags_tx, flags))
96 1.1 rin goto quit;
97 1.1 rin
98 1.1 rin KASSERT(m->m_pkthdr.len >= sizeof(*ep));
99 1.1 rin if (m->m_len < sizeof(*ep)) {
100 1.1 rin m = m_pullup(m, sizeof(*ep));
101 1.1 rin if (m == NULL)
102 1.1 rin return NULL;
103 1.1 rin }
104 1.1 rin ep = mtod(m, struct ether_header *);
105 1.5 rin switch (type = ntohs(ep->ether_type)) {
106 1.1 rin case ETHERTYPE_IP:
107 1.1 rin case ETHERTYPE_IPV6:
108 1.1 rin ehlen = ETHER_HDR_LEN;
109 1.1 rin break;
110 1.1 rin case ETHERTYPE_VLAN:
111 1.1 rin ehlen = ETHER_HDR_LEN + ETHER_VLAN_ENCAP_LEN;
112 1.1 rin break;
113 1.1 rin default:
114 1.5 rin if (ratecheck(&eso_err_lasttime, &eso_err_interval))
115 1.5 rin log(LOG_ERR, "%s: %s: dropping invalid frame "
116 1.5 rin "type 0x%04hx csum_flags 0x%08x\n",
117 1.5 rin __func__, ifp->if_xname, type, flags);
118 1.5 rin goto quit;
119 1.1 rin }
120 1.1 rin KASSERT(m->m_pkthdr.len >= ehlen);
121 1.1 rin
122 1.2 rin v6 = flags & (M_CSUM_TSOv6 | M_CSUM_TCPv6 | M_CSUM_UDPv6);
123 1.2 rin #ifndef INET6
124 1.2 rin KASSERT(!v6);
125 1.2 rin #endif
126 1.1 rin
127 1.1 rin if (flags & (M_CSUM_TSOv4 | M_CSUM_TSOv6)) {
128 1.1 rin /*
129 1.1 rin * tcp[46]_segment() assume that size of payloads is
130 1.1 rin * a multiple of MSS. Further, tcp6_segment() assumes
131 1.1 rin * no extention headers.
132 1.1 rin *
133 1.1 rin * XXX Do we need some KASSERT's?
134 1.1 rin */
135 1.2 rin #ifdef INET6
136 1.2 rin if (v6)
137 1.2 rin return tcp6_segment(m, ehlen);
138 1.2 rin else
139 1.2 rin #endif
140 1.1 rin return tcp4_segment(m, ehlen);
141 1.1 rin }
142 1.1 rin
143 1.2 rin #ifdef INET6
144 1.2 rin if (v6)
145 1.2 rin in6_undefer_cksum(m, ehlen, flags);
146 1.2 rin else
147 1.2 rin #endif
148 1.1 rin in_undefer_cksum(m, ehlen, flags);
149 1.1 rin done:
150 1.1 rin m->m_pkthdr.csum_flags = 0;
151 1.1 rin m->m_nextpkt = NULL;
152 1.1 rin return m;
153 1.1 rin quit:
154 1.1 rin m_freem(m);
155 1.1 rin return NULL;
156 1.1 rin }
157 1.1 rin
158 1.1 rin /*
159 1.1 rin * Handle RX offload in software.
160 1.1 rin *
161 1.1 rin * XXX Fragmented packets or packets with IPv6 extension headers
162 1.1 rin * are not currently supported.
163 1.1 rin */
164 1.1 rin
165 1.1 rin struct mbuf *
166 1.1 rin ether_sw_offload_rx(struct ifnet *ifp, struct mbuf *m)
167 1.1 rin {
168 1.1 rin struct ether_header *eh;
169 1.1 rin struct ip *ip;
170 1.1 rin struct tcphdr *th;
171 1.1 rin struct udphdr *uh;
172 1.1 rin uint16_t sum, osum;
173 1.1 rin uint8_t proto;
174 1.1 rin int flags, enabled, len, ehlen, iphlen, l4offset;
175 1.2 rin bool v6;
176 1.1 rin
177 1.1 rin flags = 0;
178 1.1 rin
179 1.1 rin enabled = ifp->if_csum_flags_rx;
180 1.1 rin if (!(enabled & (M_CSUM_IPv4 | M_CSUM_TCPv4 | M_CSUM_UDPv4 |
181 1.1 rin M_CSUM_TCPv6 | M_CSUM_UDPv6)))
182 1.1 rin goto done;
183 1.1 rin
184 1.1 rin KASSERT(m->m_flags & M_PKTHDR);
185 1.1 rin len = m->m_pkthdr.len;
186 1.1 rin
187 1.1 rin KASSERT(len >= sizeof(*eh));
188 1.1 rin if (m->m_len < sizeof(*eh)) {
189 1.1 rin m = m_pullup(m, sizeof(*eh));
190 1.1 rin if (m == NULL)
191 1.1 rin return NULL;
192 1.1 rin }
193 1.1 rin eh = mtod(m, struct ether_header *);
194 1.1 rin switch (htons(eh->ether_type)) {
195 1.1 rin case ETHERTYPE_IP:
196 1.1 rin case ETHERTYPE_IPV6:
197 1.1 rin ehlen = ETHER_HDR_LEN;
198 1.1 rin break;
199 1.1 rin case ETHERTYPE_VLAN:
200 1.1 rin ehlen = ETHER_HDR_LEN + ETHER_VLAN_ENCAP_LEN;
201 1.1 rin break;
202 1.1 rin default:
203 1.1 rin goto done;
204 1.1 rin }
205 1.1 rin
206 1.1 rin KASSERT(len >= ehlen);
207 1.1 rin len = m->m_pkthdr.len - ehlen;
208 1.1 rin
209 1.1 rin KASSERT(len >= sizeof(*ip));
210 1.1 rin if (m->m_len < ehlen + sizeof(*ip)) {
211 1.1 rin m = m_pullup(m, ehlen + sizeof(*ip));
212 1.1 rin if (m == NULL)
213 1.1 rin return NULL;
214 1.1 rin }
215 1.1 rin ip = (void *)(mtod(m, char *) + ehlen);
216 1.2 rin v6 = (ip->ip_v != IPVERSION);
217 1.2 rin
218 1.2 rin if (v6) {
219 1.2 rin #ifdef INET6
220 1.2 rin struct ip6_hdr *ip6;
221 1.2 rin
222 1.2 rin KASSERT(len >= sizeof(*ip6));
223 1.2 rin if (m->m_len < ehlen + sizeof(*ip6)) {
224 1.2 rin m = m_pullup(m, ehlen + sizeof(*ip6));
225 1.2 rin if (m == NULL)
226 1.2 rin return NULL;
227 1.2 rin }
228 1.2 rin ip6 = (void *)(mtod(m, char *) + ehlen);
229 1.2 rin KASSERT((ip6->ip6_vfc & IPV6_VERSION_MASK) == IPV6_VERSION);
230 1.1 rin
231 1.2 rin iphlen = sizeof(*ip6);
232 1.2 rin
233 1.2 rin len -= iphlen;
234 1.2 rin
235 1.2 rin proto = ip6->ip6_nxt;
236 1.2 rin switch (proto) {
237 1.2 rin case IPPROTO_TCP:
238 1.2 rin if (!(enabled & M_CSUM_TCPv6))
239 1.2 rin goto done;
240 1.2 rin break;
241 1.2 rin case IPPROTO_UDP:
242 1.2 rin if (!(enabled & M_CSUM_UDPv6))
243 1.2 rin goto done;
244 1.2 rin break;
245 1.2 rin default:
246 1.2 rin /* XXX Extension headers are not supported. */
247 1.2 rin goto done;
248 1.2 rin }
249 1.2 rin
250 1.2 rin sum = in6_cksum_phdr(&ip6->ip6_src, &ip6->ip6_dst, htonl(len),
251 1.2 rin htonl(proto));
252 1.2 rin #else
253 1.2 rin goto done;
254 1.2 rin #endif
255 1.2 rin } else {
256 1.1 rin if (enabled & M_CSUM_IPv4)
257 1.1 rin flags |= M_CSUM_IPv4;
258 1.1 rin
259 1.1 rin iphlen = ip->ip_hl << 2;
260 1.1 rin KASSERT(iphlen >= sizeof(*ip));
261 1.1 rin
262 1.1 rin len -= iphlen;
263 1.1 rin KASSERT(len >= 0);
264 1.1 rin
265 1.1 rin if (in4_cksum(m, 0, ehlen, iphlen) != 0) {
266 1.1 rin if (enabled & M_CSUM_IPv4)
267 1.1 rin flags |= M_CSUM_IPv4_BAD;
268 1.1 rin /* Broken. Do not check further. */
269 1.1 rin goto done;
270 1.1 rin }
271 1.1 rin
272 1.1 rin /* Check if fragmented. */
273 1.1 rin if (ntohs(ip->ip_off) & ~(IP_DF | IP_RF))
274 1.1 rin goto done;
275 1.1 rin
276 1.1 rin proto = ip->ip_p;
277 1.1 rin switch (proto) {
278 1.1 rin case IPPROTO_TCP:
279 1.1 rin if (!(enabled & M_CSUM_TCPv4))
280 1.1 rin goto done;
281 1.1 rin break;
282 1.1 rin case IPPROTO_UDP:
283 1.1 rin if (!(enabled & M_CSUM_UDPv4))
284 1.1 rin goto done;
285 1.1 rin break;
286 1.1 rin default:
287 1.1 rin goto done;
288 1.1 rin }
289 1.1 rin
290 1.1 rin sum = in_cksum_phdr(ip->ip_src.s_addr, ip->ip_dst.s_addr,
291 1.1 rin htons((uint16_t)len + proto));
292 1.1 rin }
293 1.1 rin
294 1.1 rin l4offset = ehlen + iphlen;
295 1.1 rin switch (proto) {
296 1.1 rin case IPPROTO_TCP:
297 1.1 rin KASSERT(len >= sizeof(*th));
298 1.1 rin if (m->m_len < l4offset + sizeof(*th)) {
299 1.1 rin m = m_pullup(m, l4offset + sizeof(*th));
300 1.1 rin if (m == NULL)
301 1.1 rin return NULL;
302 1.1 rin }
303 1.1 rin th = (void *)(mtod(m, char *) + l4offset);
304 1.1 rin osum = th->th_sum;
305 1.1 rin th->th_sum = sum;
306 1.2 rin #ifdef INET6
307 1.2 rin if (v6) {
308 1.2 rin flags |= M_CSUM_TCPv6;
309 1.2 rin sum = in6_cksum(m, 0, l4offset, len);
310 1.2 rin } else
311 1.2 rin #endif
312 1.2 rin {
313 1.1 rin flags |= M_CSUM_TCPv4;
314 1.1 rin sum = in4_cksum(m, 0, l4offset, len);
315 1.1 rin }
316 1.1 rin if (sum != osum)
317 1.1 rin flags |= M_CSUM_TCP_UDP_BAD;
318 1.1 rin th->th_sum = osum;
319 1.1 rin break;
320 1.1 rin case IPPROTO_UDP:
321 1.1 rin KASSERT(len >= sizeof(*uh));
322 1.1 rin if (m->m_len < l4offset + sizeof(*uh)) {
323 1.1 rin m = m_pullup(m, l4offset + sizeof(*uh));
324 1.1 rin if (m == NULL)
325 1.1 rin return NULL;
326 1.1 rin }
327 1.1 rin uh = (void *)(mtod(m, char *) + l4offset);
328 1.1 rin osum = uh->uh_sum;
329 1.1 rin if (osum == 0)
330 1.1 rin break;
331 1.1 rin uh->uh_sum = sum;
332 1.2 rin #ifdef INET6
333 1.2 rin if (v6) {
334 1.2 rin flags |= M_CSUM_UDPv6;
335 1.2 rin sum = in6_cksum(m, 0, l4offset, len);
336 1.2 rin } else
337 1.2 rin #endif
338 1.2 rin {
339 1.1 rin flags |= M_CSUM_UDPv4;
340 1.1 rin sum = in4_cksum(m, 0, l4offset, len);
341 1.1 rin }
342 1.1 rin if (sum == 0)
343 1.1 rin sum = 0xffff;
344 1.1 rin if (sum != osum)
345 1.1 rin flags |= M_CSUM_TCP_UDP_BAD;
346 1.1 rin uh->uh_sum = osum;
347 1.1 rin break;
348 1.1 rin default:
349 1.1 rin panic("%s: impossible", __func__);
350 1.1 rin }
351 1.1 rin
352 1.1 rin done:
353 1.1 rin m->m_pkthdr.csum_flags = flags;
354 1.1 rin return m;
355 1.1 rin }
356