Home | History | Annotate | Line # | Download | only in netinet
in_offload.c revision 1.3.2.1
      1  1.3.2.1  jruoho /*	$NetBSD: in_offload.c,v 1.3.2.1 2011/06/06 09:09:55 jruoho Exp $	*/
      2      1.1    yamt 
      3      1.1    yamt /*-
      4      1.1    yamt  * Copyright (c)2005, 2006 YAMAMOTO Takashi,
      5      1.1    yamt  * All rights reserved.
      6      1.1    yamt  *
      7      1.1    yamt  * Redistribution and use in source and binary forms, with or without
      8      1.1    yamt  * modification, are permitted provided that the following conditions
      9      1.1    yamt  * are met:
     10      1.1    yamt  * 1. Redistributions of source code must retain the above copyright
     11      1.1    yamt  *    notice, this list of conditions and the following disclaimer.
     12      1.1    yamt  * 2. Redistributions in binary form must reproduce the above copyright
     13      1.1    yamt  *    notice, this list of conditions and the following disclaimer in the
     14      1.1    yamt  *    documentation and/or other materials provided with the distribution.
     15      1.1    yamt  *
     16      1.1    yamt  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
     17      1.1    yamt  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     18      1.1    yamt  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     19      1.1    yamt  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
     20      1.1    yamt  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     21      1.1    yamt  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     22      1.1    yamt  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     23      1.1    yamt  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     24      1.1    yamt  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     25      1.1    yamt  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     26      1.1    yamt  * SUCH DAMAGE.
     27      1.1    yamt  */
     28      1.1    yamt 
     29      1.1    yamt #include <sys/cdefs.h>
     30  1.3.2.1  jruoho __KERNEL_RCSID(0, "$NetBSD: in_offload.c,v 1.3.2.1 2011/06/06 09:09:55 jruoho Exp $");
     31      1.1    yamt 
     32      1.1    yamt #include <sys/param.h>
     33      1.1    yamt #include <sys/mbuf.h>
     34      1.1    yamt 
     35      1.1    yamt #include <net/if.h>
     36      1.1    yamt 
     37      1.1    yamt #include <netinet/in.h>
     38      1.1    yamt #include <netinet/in_systm.h>
     39      1.1    yamt #include <netinet/ip.h>
     40      1.1    yamt #include <netinet/tcp.h>
     41      1.1    yamt #include <netinet/in_offload.h>
     42      1.1    yamt 
     43      1.1    yamt struct ip_tso_output_args {
     44      1.1    yamt 	struct ifnet *ifp;
     45      1.2  dyoung 	const struct sockaddr *sa;
     46      1.1    yamt 	struct rtentry *rt;
     47      1.1    yamt };
     48      1.1    yamt 
     49      1.1    yamt static int ip_tso_output_callback(void *, struct mbuf *);
     50      1.1    yamt 
     51      1.1    yamt static int
     52      1.1    yamt ip_tso_output_callback(void *vp, struct mbuf *m)
     53      1.1    yamt {
     54      1.1    yamt 	struct ip_tso_output_args *args = vp;
     55      1.1    yamt 	struct ifnet *ifp = args->ifp;
     56  1.3.2.1  jruoho 	int error;
     57      1.1    yamt 
     58  1.3.2.1  jruoho 	KERNEL_LOCK(1, NULL);
     59  1.3.2.1  jruoho 	error = (*ifp->if_output)(ifp, m, args->sa, args->rt);
     60  1.3.2.1  jruoho 	KERNEL_UNLOCK_ONE(NULL);
     61  1.3.2.1  jruoho 	return error;
     62      1.1    yamt }
     63      1.1    yamt 
     64      1.1    yamt int
     65      1.2  dyoung ip_tso_output(struct ifnet *ifp, struct mbuf *m, const struct sockaddr *sa,
     66      1.1    yamt     struct rtentry *rt)
     67      1.1    yamt {
     68      1.1    yamt 	struct ip_tso_output_args args;
     69      1.1    yamt 
     70      1.1    yamt 	args.ifp = ifp;
     71      1.1    yamt 	args.sa = sa;
     72      1.1    yamt 	args.rt = rt;
     73      1.1    yamt 
     74      1.1    yamt 	return tcp4_segment(m, ip_tso_output_callback, &args);
     75      1.1    yamt }
     76      1.1    yamt 
     77      1.1    yamt /*
     78      1.1    yamt  * tcp4_segment: handle M_CSUM_TSOv4 by software.
     79      1.1    yamt  *
     80      1.1    yamt  * => always consume m.
     81      1.1    yamt  * => call output_func with output_arg for each segments.
     82      1.1    yamt  */
     83      1.1    yamt 
     84      1.1    yamt int
     85      1.1    yamt tcp4_segment(struct mbuf *m, int (*output_func)(void *, struct mbuf *),
     86      1.1    yamt     void *output_arg)
     87      1.1    yamt {
     88      1.1    yamt 	int mss;
     89      1.1    yamt 	int iphlen;
     90      1.1    yamt 	int thlen;
     91      1.1    yamt 	int hlen;
     92      1.1    yamt 	int len;
     93      1.1    yamt 	struct ip *iph;
     94      1.1    yamt 	struct tcphdr *th;
     95      1.1    yamt 	uint16_t ipid;
     96      1.1    yamt 	uint32_t tcpseq;
     97      1.1    yamt 	struct mbuf *hdr = NULL;
     98      1.1    yamt 	struct mbuf *t;
     99      1.1    yamt 	int error = 0;
    100      1.1    yamt 
    101      1.1    yamt 	KASSERT((m->m_flags & M_PKTHDR) != 0);
    102      1.1    yamt 	KASSERT((m->m_pkthdr.csum_flags & M_CSUM_TSOv4) != 0);
    103      1.1    yamt 
    104      1.1    yamt 	m->m_pkthdr.csum_flags = 0;
    105      1.1    yamt 
    106      1.1    yamt 	len = m->m_pkthdr.len;
    107      1.1    yamt 	KASSERT(len >= sizeof(*iph) + sizeof(*th));
    108      1.1    yamt 
    109      1.1    yamt 	if (m->m_len < sizeof(*iph)) {
    110      1.1    yamt 		m = m_pullup(m, sizeof(*iph));
    111      1.1    yamt 		if (m == NULL) {
    112      1.1    yamt 			error = ENOMEM;
    113      1.1    yamt 			goto quit;
    114      1.1    yamt 		}
    115      1.1    yamt 	}
    116      1.1    yamt 	iph = mtod(m, struct ip *);
    117      1.1    yamt 	iphlen = iph->ip_hl * 4;
    118      1.1    yamt 	KASSERT(iph->ip_v == IPVERSION);
    119      1.1    yamt 	KASSERT(iphlen >= sizeof(*iph));
    120      1.1    yamt 	KASSERT(iph->ip_p == IPPROTO_TCP);
    121      1.1    yamt 	ipid = ntohs(iph->ip_id);
    122      1.1    yamt 
    123      1.1    yamt 	hlen = iphlen + sizeof(*th);
    124      1.1    yamt 	if (m->m_len < hlen) {
    125      1.1    yamt 		m = m_pullup(m, hlen);
    126      1.1    yamt 		if (m == NULL) {
    127      1.1    yamt 			error = ENOMEM;
    128      1.1    yamt 			goto quit;
    129      1.1    yamt 		}
    130      1.1    yamt 	}
    131      1.1    yamt 	th = (void *)(mtod(m, char *) + iphlen);
    132      1.1    yamt 	tcpseq = ntohl(th->th_seq);
    133      1.1    yamt 	thlen = th->th_off * 4;
    134      1.1    yamt 	hlen = iphlen + thlen;
    135      1.1    yamt 
    136      1.1    yamt 	mss = m->m_pkthdr.segsz;
    137      1.1    yamt 	KASSERT(mss != 0);
    138      1.1    yamt 	KASSERT(len > hlen);
    139      1.1    yamt 
    140      1.1    yamt 	t = m_split(m, hlen, M_NOWAIT);
    141      1.1    yamt 	if (t == NULL) {
    142      1.1    yamt 		error = ENOMEM;
    143      1.1    yamt 		goto quit;
    144      1.1    yamt 	}
    145      1.1    yamt 	hdr = m;
    146      1.1    yamt 	m = t;
    147      1.1    yamt 	len -= hlen;
    148      1.1    yamt 	KASSERT(len % mss == 0);
    149      1.1    yamt 	while (len > 0) {
    150      1.1    yamt 		struct mbuf *n;
    151      1.1    yamt 
    152      1.1    yamt 		n = m_dup(hdr, 0, hlen, M_NOWAIT);
    153      1.1    yamt 		if (n == NULL) {
    154      1.1    yamt 			error = ENOMEM;
    155      1.1    yamt 			goto quit;
    156      1.1    yamt 		}
    157      1.1    yamt 		KASSERT(n->m_len == hlen); /* XXX */
    158      1.1    yamt 
    159      1.1    yamt 		t = m_split(m, mss, M_NOWAIT);
    160      1.1    yamt 		if (t == NULL) {
    161      1.1    yamt 			m_freem(n);
    162      1.1    yamt 			error = ENOMEM;
    163      1.1    yamt 			goto quit;
    164      1.1    yamt 		}
    165      1.1    yamt 		m_cat(n, m);
    166      1.1    yamt 		m = t;
    167      1.1    yamt 
    168      1.1    yamt 		KASSERT(n->m_len >= hlen); /* XXX */
    169      1.1    yamt 
    170      1.1    yamt 		n->m_pkthdr.len = hlen + mss;
    171      1.1    yamt 		iph = mtod(n, struct ip *);
    172      1.1    yamt 		KASSERT(iph->ip_v == IPVERSION);
    173      1.1    yamt 		iph->ip_len = htons(n->m_pkthdr.len);
    174      1.1    yamt 		iph->ip_id = htons(ipid);
    175      1.1    yamt 		th = (void *)(mtod(n, char *) + iphlen);
    176      1.1    yamt 		th->th_seq = htonl(tcpseq);
    177      1.1    yamt 		iph->ip_sum = 0;
    178      1.1    yamt 		iph->ip_sum = in_cksum(n, iphlen);
    179      1.1    yamt 		th->th_sum = 0;
    180      1.1    yamt 		th->th_sum = in4_cksum(n, IPPROTO_TCP, iphlen, thlen + mss);
    181      1.1    yamt 
    182      1.1    yamt 		error = (*output_func)(output_arg, n);
    183      1.1    yamt 		if (error) {
    184      1.1    yamt 			goto quit;
    185      1.1    yamt 		}
    186      1.1    yamt 
    187      1.1    yamt 		tcpseq += mss;
    188      1.1    yamt 		ipid++;
    189      1.1    yamt 		len -= mss;
    190      1.1    yamt 	}
    191      1.1    yamt 
    192      1.1    yamt quit:
    193      1.1    yamt 	if (hdr != NULL) {
    194      1.1    yamt 		m_freem(hdr);
    195      1.1    yamt 	}
    196      1.1    yamt 	if (m != NULL) {
    197      1.1    yamt 		m_freem(m);
    198      1.1    yamt 	}
    199      1.1    yamt 
    200      1.1    yamt 	return error;
    201      1.1    yamt }
    202      1.3    matt 
    203      1.3    matt void
    204      1.3    matt ip_undefer_csum(struct mbuf *m, size_t hdrlen, int csum_flags)
    205      1.3    matt {
    206  1.3.2.1  jruoho 	const size_t iphdrlen = M_CSUM_DATA_IPv4_IPHL(m->m_pkthdr.csum_data);
    207      1.3    matt 	uint16_t csum;
    208      1.3    matt 	uint16_t ip_len;
    209      1.3    matt 	uint16_t *csump;
    210  1.3.2.1  jruoho 
    211  1.3.2.1  jruoho 	KASSERT(m->m_flags & M_PKTHDR);
    212  1.3.2.1  jruoho 	KASSERT((m->m_pkthdr.csum_flags & csum_flags) == csum_flags);
    213      1.3    matt 
    214      1.3    matt 	if (__predict_true(hdrlen + sizeof(struct ip) <= m->m_len)) {
    215      1.3    matt 		struct ip *ip = (struct ip *)(mtod(m, uint8_t *) + hdrlen);
    216  1.3.2.1  jruoho 
    217      1.3    matt 		ip_len = ip->ip_len;
    218      1.3    matt 		csump = &ip->ip_sum;
    219      1.3    matt 	} else {
    220  1.3.2.1  jruoho 		const size_t ip_len_offset =
    221  1.3.2.1  jruoho 		    hdrlen + offsetof(struct ip, ip_len);
    222  1.3.2.1  jruoho 
    223      1.3    matt 		m_copydata(m, ip_len_offset, sizeof(ip_len), &ip_len);
    224      1.3    matt 		csump = NULL;
    225      1.3    matt 	}
    226  1.3.2.1  jruoho 	ip_len = ntohs(ip_len);
    227      1.3    matt 
    228      1.3    matt 	if (csum_flags & M_CSUM_IPv4) {
    229      1.3    matt 		csum = in4_cksum(m, 0, hdrlen, iphdrlen);
    230      1.3    matt 		if (csump != NULL) {
    231      1.3    matt 			*csump = csum;
    232      1.3    matt 		} else {
    233  1.3.2.1  jruoho 			const size_t offset = hdrlen +
    234  1.3.2.1  jruoho 			    offsetof(struct ip, ip_sum);
    235  1.3.2.1  jruoho 
    236      1.3    matt 			m_copyback(m, offset, sizeof(uint16_t), &csum);
    237      1.3    matt 		}
    238      1.3    matt 	}
    239      1.3    matt 
    240      1.3    matt 	if (csum_flags & (M_CSUM_UDPv4|M_CSUM_TCPv4)) {
    241  1.3.2.1  jruoho 		size_t l4offset = hdrlen + iphdrlen;
    242      1.3    matt 
    243  1.3.2.1  jruoho 		csum = in4_cksum(m, 0, l4offset, ip_len - l4offset - hdrlen);
    244      1.3    matt 		if (csum == 0 && (csum_flags & M_CSUM_UDPv4) != 0)
    245      1.3    matt 			csum = 0xffff;
    246      1.3    matt 
    247      1.3    matt 		l4offset += M_CSUM_DATA_IPv4_OFFSET(m->m_pkthdr.csum_data);
    248      1.3    matt 
    249      1.3    matt 		if (__predict_true(l4offset + sizeof(uint16_t) <= m->m_len)) {
    250      1.3    matt 			*(uint16_t *)(mtod(m, char *) + l4offset) = csum;
    251      1.3    matt 		} else {
    252      1.3    matt 			m_copyback(m, l4offset, sizeof(csum), (void *) &csum);
    253      1.3    matt 		}
    254      1.3    matt 	}
    255      1.3    matt 
    256      1.3    matt 	m->m_pkthdr.csum_flags ^= csum_flags;
    257      1.3    matt }
    258