ether_sw_offload.c revision 1.2 1 1.2 rin /* $NetBSD: ether_sw_offload.c,v 1.2 2018/12/13 12:13:33 rin Exp $ */
2 1.1 rin
3 1.1 rin /*
4 1.1 rin * Copyright (c) 2018 The NetBSD Foundation, Inc.
5 1.1 rin * All rights reserved.
6 1.1 rin *
7 1.1 rin * This code is derived from software contributed to The NetBSD Foundation
8 1.1 rin * by Rin Okuyama.
9 1.1 rin *
10 1.1 rin * Redistribution and use in source and binary forms, with or without
11 1.1 rin * modification, are permitted provided that the following conditions
12 1.1 rin * are met:
13 1.1 rin * 1. Redistributions of source code must retain the above copyright
14 1.1 rin * notice, this list of conditions and the following disclaimer.
15 1.1 rin * 2. Redistributions in binary form must reproduce the above copyright
16 1.1 rin * notice, this list of conditions and the following disclaimer in the
17 1.1 rin * documentation and/or other materials provided with the distribution.
18 1.1 rin *
19 1.1 rin * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
20 1.1 rin * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
21 1.1 rin * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 1.1 rin * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
23 1.1 rin * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24 1.1 rin * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25 1.1 rin * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26 1.1 rin * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27 1.1 rin * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28 1.1 rin * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29 1.1 rin * POSSIBILITY OF SUCH DAMAGE.
30 1.1 rin */
31 1.1 rin
32 1.2 rin #ifdef _KERNEL_OPT
33 1.2 rin #include "opt_inet.h"
34 1.2 rin #endif
35 1.2 rin
36 1.1 rin #include <sys/cdefs.h>
37 1.2 rin __KERNEL_RCSID(0, "$NetBSD: ether_sw_offload.c,v 1.2 2018/12/13 12:13:33 rin Exp $");
38 1.1 rin
39 1.1 rin #include <sys/param.h>
40 1.1 rin #include <sys/types.h>
41 1.1 rin #include <sys/mbuf.h>
42 1.1 rin
43 1.1 rin #include <net/if.h>
44 1.1 rin #include <net/if_ether.h>
45 1.1 rin #include <net/ether_sw_offload.h>
46 1.1 rin
47 1.1 rin #include <netinet/in.h>
48 1.1 rin #include <netinet/in_offload.h>
49 1.1 rin #include <netinet/ip.h>
50 1.1 rin #include <netinet/tcp.h>
51 1.1 rin #include <netinet/udp.h>
52 1.1 rin
53 1.2 rin #ifdef INET6
54 1.2 rin #include <netinet/ip6.h>
55 1.1 rin #include <netinet6/in6.h>
56 1.1 rin #include <netinet6/in6_offload.h>
57 1.2 rin #endif
58 1.1 rin
59 1.1 rin /*
60 1.1 rin * Handle TX offload in software. For TSO, split the packet into
61 1.1 rin * chanks with payloads of size MSS. For chekcsum offload, update
62 1.1 rin * required checksum fields. The results are more than one packet
63 1.1 rin * in general. Return a mbuf chain consists of them.
64 1.1 rin */
65 1.1 rin
66 1.1 rin struct mbuf *
67 1.1 rin ether_sw_offload_tx(struct ifnet *ifp, struct mbuf *m)
68 1.1 rin {
69 1.1 rin struct ether_header *ep;
70 1.1 rin int flags, ehlen;
71 1.2 rin bool v6;
72 1.1 rin
73 1.1 rin KASSERT(m->m_flags & M_PKTHDR);
74 1.1 rin flags = m->m_pkthdr.csum_flags;
75 1.1 rin if (flags == 0)
76 1.1 rin goto done;
77 1.1 rin
78 1.1 rin /* Sanity check */
79 1.1 rin if (!TX_OFFLOAD_SUPPORTED(ifp->if_csum_flags_tx, flags))
80 1.1 rin goto quit;
81 1.1 rin
82 1.1 rin KASSERT(m->m_pkthdr.len >= sizeof(*ep));
83 1.1 rin if (m->m_len < sizeof(*ep)) {
84 1.1 rin m = m_pullup(m, sizeof(*ep));
85 1.1 rin if (m == NULL)
86 1.1 rin return NULL;
87 1.1 rin }
88 1.1 rin ep = mtod(m, struct ether_header *);
89 1.1 rin switch (ntohs(ep->ether_type)) {
90 1.1 rin case ETHERTYPE_IP:
91 1.1 rin case ETHERTYPE_IPV6:
92 1.1 rin ehlen = ETHER_HDR_LEN;
93 1.1 rin break;
94 1.1 rin case ETHERTYPE_VLAN:
95 1.1 rin ehlen = ETHER_HDR_LEN + ETHER_VLAN_ENCAP_LEN;
96 1.1 rin break;
97 1.1 rin default:
98 1.1 rin goto quit;
99 1.1 rin }
100 1.1 rin KASSERT(m->m_pkthdr.len >= ehlen);
101 1.1 rin
102 1.2 rin v6 = flags & (M_CSUM_TSOv6 | M_CSUM_TCPv6 | M_CSUM_UDPv6);
103 1.2 rin #ifndef INET6
104 1.2 rin KASSERT(!v6);
105 1.2 rin #endif
106 1.1 rin
107 1.1 rin if (flags & (M_CSUM_TSOv4 | M_CSUM_TSOv6)) {
108 1.1 rin /*
109 1.1 rin * tcp[46]_segment() assume that size of payloads is
110 1.1 rin * a multiple of MSS. Further, tcp6_segment() assumes
111 1.1 rin * no extention headers.
112 1.1 rin *
113 1.1 rin * XXX Do we need some KASSERT's?
114 1.1 rin */
115 1.2 rin #ifdef INET6
116 1.2 rin if (v6)
117 1.2 rin return tcp6_segment(m, ehlen);
118 1.2 rin else
119 1.2 rin #endif
120 1.1 rin return tcp4_segment(m, ehlen);
121 1.1 rin }
122 1.1 rin
123 1.2 rin #ifdef INET6
124 1.2 rin if (v6)
125 1.2 rin in6_undefer_cksum(m, ehlen, flags);
126 1.2 rin else
127 1.2 rin #endif
128 1.1 rin in_undefer_cksum(m, ehlen, flags);
129 1.1 rin done:
130 1.1 rin m->m_pkthdr.csum_flags = 0;
131 1.1 rin m->m_nextpkt = NULL;
132 1.1 rin return m;
133 1.1 rin quit:
134 1.1 rin m_freem(m);
135 1.1 rin return NULL;
136 1.1 rin }
137 1.1 rin
138 1.1 rin /*
139 1.1 rin * Handle RX offload in software.
140 1.1 rin *
141 1.1 rin * XXX Fragmented packets or packets with IPv6 extension headers
142 1.1 rin * are not currently supported.
143 1.1 rin */
144 1.1 rin
145 1.1 rin struct mbuf *
146 1.1 rin ether_sw_offload_rx(struct ifnet *ifp, struct mbuf *m)
147 1.1 rin {
148 1.1 rin struct ether_header *eh;
149 1.1 rin struct ip *ip;
150 1.1 rin struct tcphdr *th;
151 1.1 rin struct udphdr *uh;
152 1.1 rin uint16_t sum, osum;
153 1.1 rin uint8_t proto;
154 1.1 rin int flags, enabled, len, ehlen, iphlen, l4offset;
155 1.2 rin bool v6;
156 1.1 rin
157 1.1 rin flags = 0;
158 1.1 rin
159 1.1 rin enabled = ifp->if_csum_flags_rx;
160 1.1 rin if (!(enabled & (M_CSUM_IPv4 | M_CSUM_TCPv4 | M_CSUM_UDPv4 |
161 1.1 rin M_CSUM_TCPv6 | M_CSUM_UDPv6)))
162 1.1 rin goto done;
163 1.1 rin
164 1.1 rin KASSERT(m->m_flags & M_PKTHDR);
165 1.1 rin len = m->m_pkthdr.len;
166 1.1 rin
167 1.1 rin KASSERT(len >= sizeof(*eh));
168 1.1 rin if (m->m_len < sizeof(*eh)) {
169 1.1 rin m = m_pullup(m, sizeof(*eh));
170 1.1 rin if (m == NULL)
171 1.1 rin return NULL;
172 1.1 rin }
173 1.1 rin eh = mtod(m, struct ether_header *);
174 1.1 rin switch (htons(eh->ether_type)) {
175 1.1 rin case ETHERTYPE_IP:
176 1.1 rin case ETHERTYPE_IPV6:
177 1.1 rin ehlen = ETHER_HDR_LEN;
178 1.1 rin break;
179 1.1 rin case ETHERTYPE_VLAN:
180 1.1 rin ehlen = ETHER_HDR_LEN + ETHER_VLAN_ENCAP_LEN;
181 1.1 rin break;
182 1.1 rin default:
183 1.1 rin goto done;
184 1.1 rin }
185 1.1 rin
186 1.1 rin KASSERT(len >= ehlen);
187 1.1 rin len = m->m_pkthdr.len - ehlen;
188 1.1 rin
189 1.1 rin KASSERT(len >= sizeof(*ip));
190 1.1 rin if (m->m_len < ehlen + sizeof(*ip)) {
191 1.1 rin m = m_pullup(m, ehlen + sizeof(*ip));
192 1.1 rin if (m == NULL)
193 1.1 rin return NULL;
194 1.1 rin }
195 1.1 rin ip = (void *)(mtod(m, char *) + ehlen);
196 1.2 rin v6 = (ip->ip_v != IPVERSION);
197 1.2 rin
198 1.2 rin if (v6) {
199 1.2 rin #ifdef INET6
200 1.2 rin struct ip6_hdr *ip6;
201 1.2 rin
202 1.2 rin KASSERT(len >= sizeof(*ip6));
203 1.2 rin if (m->m_len < ehlen + sizeof(*ip6)) {
204 1.2 rin m = m_pullup(m, ehlen + sizeof(*ip6));
205 1.2 rin if (m == NULL)
206 1.2 rin return NULL;
207 1.2 rin }
208 1.2 rin ip6 = (void *)(mtod(m, char *) + ehlen);
209 1.2 rin KASSERT((ip6->ip6_vfc & IPV6_VERSION_MASK) == IPV6_VERSION);
210 1.1 rin
211 1.2 rin iphlen = sizeof(*ip6);
212 1.2 rin
213 1.2 rin len -= iphlen;
214 1.2 rin
215 1.2 rin proto = ip6->ip6_nxt;
216 1.2 rin switch (proto) {
217 1.2 rin case IPPROTO_TCP:
218 1.2 rin if (!(enabled & M_CSUM_TCPv6))
219 1.2 rin goto done;
220 1.2 rin break;
221 1.2 rin case IPPROTO_UDP:
222 1.2 rin if (!(enabled & M_CSUM_UDPv6))
223 1.2 rin goto done;
224 1.2 rin break;
225 1.2 rin default:
226 1.2 rin /* XXX Extension headers are not supported. */
227 1.2 rin goto done;
228 1.2 rin }
229 1.2 rin
230 1.2 rin sum = in6_cksum_phdr(&ip6->ip6_src, &ip6->ip6_dst, htonl(len),
231 1.2 rin htonl(proto));
232 1.2 rin #else
233 1.2 rin goto done;
234 1.2 rin #endif
235 1.2 rin } else {
236 1.1 rin if (enabled & M_CSUM_IPv4)
237 1.1 rin flags |= M_CSUM_IPv4;
238 1.1 rin
239 1.1 rin iphlen = ip->ip_hl << 2;
240 1.1 rin KASSERT(iphlen >= sizeof(*ip));
241 1.1 rin
242 1.1 rin len -= iphlen;
243 1.1 rin KASSERT(len >= 0);
244 1.1 rin
245 1.1 rin if (in4_cksum(m, 0, ehlen, iphlen) != 0) {
246 1.1 rin if (enabled & M_CSUM_IPv4)
247 1.1 rin flags |= M_CSUM_IPv4_BAD;
248 1.1 rin /* Broken. Do not check further. */
249 1.1 rin goto done;
250 1.1 rin }
251 1.1 rin
252 1.1 rin /* Check if fragmented. */
253 1.1 rin if (ntohs(ip->ip_off) & ~(IP_DF | IP_RF))
254 1.1 rin goto done;
255 1.1 rin
256 1.1 rin proto = ip->ip_p;
257 1.1 rin switch (proto) {
258 1.1 rin case IPPROTO_TCP:
259 1.1 rin if (!(enabled & M_CSUM_TCPv4))
260 1.1 rin goto done;
261 1.1 rin break;
262 1.1 rin case IPPROTO_UDP:
263 1.1 rin if (!(enabled & M_CSUM_UDPv4))
264 1.1 rin goto done;
265 1.1 rin break;
266 1.1 rin default:
267 1.1 rin goto done;
268 1.1 rin }
269 1.1 rin
270 1.1 rin sum = in_cksum_phdr(ip->ip_src.s_addr, ip->ip_dst.s_addr,
271 1.1 rin htons((uint16_t)len + proto));
272 1.1 rin }
273 1.1 rin
274 1.1 rin l4offset = ehlen + iphlen;
275 1.1 rin switch (proto) {
276 1.1 rin case IPPROTO_TCP:
277 1.1 rin KASSERT(len >= sizeof(*th));
278 1.1 rin if (m->m_len < l4offset + sizeof(*th)) {
279 1.1 rin m = m_pullup(m, l4offset + sizeof(*th));
280 1.1 rin if (m == NULL)
281 1.1 rin return NULL;
282 1.1 rin }
283 1.1 rin th = (void *)(mtod(m, char *) + l4offset);
284 1.1 rin osum = th->th_sum;
285 1.1 rin th->th_sum = sum;
286 1.2 rin #ifdef INET6
287 1.2 rin if (v6) {
288 1.2 rin flags |= M_CSUM_TCPv6;
289 1.2 rin sum = in6_cksum(m, 0, l4offset, len);
290 1.2 rin } else
291 1.2 rin #endif
292 1.2 rin {
293 1.1 rin flags |= M_CSUM_TCPv4;
294 1.1 rin sum = in4_cksum(m, 0, l4offset, len);
295 1.1 rin }
296 1.1 rin if (sum != osum)
297 1.1 rin flags |= M_CSUM_TCP_UDP_BAD;
298 1.1 rin th->th_sum = osum;
299 1.1 rin break;
300 1.1 rin case IPPROTO_UDP:
301 1.1 rin KASSERT(len >= sizeof(*uh));
302 1.1 rin if (m->m_len < l4offset + sizeof(*uh)) {
303 1.1 rin m = m_pullup(m, l4offset + sizeof(*uh));
304 1.1 rin if (m == NULL)
305 1.1 rin return NULL;
306 1.1 rin }
307 1.1 rin uh = (void *)(mtod(m, char *) + l4offset);
308 1.1 rin osum = uh->uh_sum;
309 1.1 rin if (osum == 0)
310 1.1 rin break;
311 1.1 rin uh->uh_sum = sum;
312 1.2 rin #ifdef INET6
313 1.2 rin if (v6) {
314 1.2 rin flags |= M_CSUM_UDPv6;
315 1.2 rin sum = in6_cksum(m, 0, l4offset, len);
316 1.2 rin } else
317 1.2 rin #endif
318 1.2 rin {
319 1.1 rin flags |= M_CSUM_UDPv4;
320 1.1 rin sum = in4_cksum(m, 0, l4offset, len);
321 1.1 rin }
322 1.1 rin if (sum == 0)
323 1.1 rin sum = 0xffff;
324 1.1 rin if (sum != osum)
325 1.1 rin flags |= M_CSUM_TCP_UDP_BAD;
326 1.1 rin uh->uh_sum = osum;
327 1.1 rin break;
328 1.1 rin default:
329 1.1 rin panic("%s: impossible", __func__);
330 1.1 rin break;
331 1.1 rin }
332 1.1 rin
333 1.1 rin done:
334 1.1 rin m->m_pkthdr.csum_flags = flags;
335 1.1 rin return m;
336 1.1 rin }
337