Home | History | Annotate | Line # | Download | only in netinet6
ip6_output.c revision 1.124
      1  1.124    dyoung /*	$NetBSD: ip6_output.c,v 1.124 2007/12/20 19:53:34 dyoung Exp $	*/
      2   1.33    itojun /*	$KAME: ip6_output.c,v 1.172 2001/03/25 09:55:56 itojun Exp $	*/
      3    1.3   thorpej 
      4    1.2    itojun /*
      5    1.2    itojun  * Copyright (C) 1995, 1996, 1997, and 1998 WIDE Project.
      6    1.2    itojun  * All rights reserved.
      7   1.19    itojun  *
      8    1.2    itojun  * Redistribution and use in source and binary forms, with or without
      9    1.2    itojun  * modification, are permitted provided that the following conditions
     10    1.2    itojun  * are met:
     11    1.2    itojun  * 1. Redistributions of source code must retain the above copyright
     12    1.2    itojun  *    notice, this list of conditions and the following disclaimer.
     13    1.2    itojun  * 2. Redistributions in binary form must reproduce the above copyright
     14    1.2    itojun  *    notice, this list of conditions and the following disclaimer in the
     15    1.2    itojun  *    documentation and/or other materials provided with the distribution.
     16    1.2    itojun  * 3. Neither the name of the project nor the names of its contributors
     17    1.2    itojun  *    may be used to endorse or promote products derived from this software
     18    1.2    itojun  *    without specific prior written permission.
     19   1.19    itojun  *
     20    1.2    itojun  * THIS SOFTWARE IS PROVIDED BY THE PROJECT AND CONTRIBUTORS ``AS IS'' AND
     21    1.2    itojun  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     22    1.2    itojun  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     23    1.2    itojun  * ARE DISCLAIMED.  IN NO EVENT SHALL THE PROJECT OR CONTRIBUTORS BE LIABLE
     24    1.2    itojun  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     25    1.2    itojun  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     26    1.2    itojun  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     27    1.2    itojun  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     28    1.2    itojun  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     29    1.2    itojun  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     30    1.2    itojun  * SUCH DAMAGE.
     31    1.2    itojun  */
     32    1.2    itojun 
     33    1.2    itojun /*
     34    1.2    itojun  * Copyright (c) 1982, 1986, 1988, 1990, 1993
     35    1.2    itojun  *	The Regents of the University of California.  All rights reserved.
     36    1.2    itojun  *
     37    1.2    itojun  * Redistribution and use in source and binary forms, with or without
     38    1.2    itojun  * modification, are permitted provided that the following conditions
     39    1.2    itojun  * are met:
     40    1.2    itojun  * 1. Redistributions of source code must retain the above copyright
     41    1.2    itojun  *    notice, this list of conditions and the following disclaimer.
     42    1.2    itojun  * 2. Redistributions in binary form must reproduce the above copyright
     43    1.2    itojun  *    notice, this list of conditions and the following disclaimer in the
     44    1.2    itojun  *    documentation and/or other materials provided with the distribution.
     45   1.62       agc  * 3. Neither the name of the University nor the names of its contributors
     46    1.2    itojun  *    may be used to endorse or promote products derived from this software
     47    1.2    itojun  *    without specific prior written permission.
     48    1.2    itojun  *
     49    1.2    itojun  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     50    1.2    itojun  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     51    1.2    itojun  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     52    1.2    itojun  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     53    1.2    itojun  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     54    1.2    itojun  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     55    1.2    itojun  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     56    1.2    itojun  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     57    1.2    itojun  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     58    1.2    itojun  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     59    1.2    itojun  * SUCH DAMAGE.
     60    1.2    itojun  *
     61    1.2    itojun  *	@(#)ip_output.c	8.3 (Berkeley) 1/21/94
     62    1.2    itojun  */
     63   1.41     lukem 
     64   1.41     lukem #include <sys/cdefs.h>
     65  1.124    dyoung __KERNEL_RCSID(0, "$NetBSD: ip6_output.c,v 1.124 2007/12/20 19:53:34 dyoung Exp $");
     66    1.2    itojun 
     67    1.2    itojun #include "opt_inet.h"
     68   1.97    rpaulo #include "opt_inet6.h"
     69    1.4   thorpej #include "opt_ipsec.h"
     70   1.15   darrenr #include "opt_pfil_hooks.h"
     71    1.2    itojun 
     72    1.2    itojun #include <sys/param.h>
     73    1.2    itojun #include <sys/malloc.h>
     74    1.2    itojun #include <sys/mbuf.h>
     75    1.2    itojun #include <sys/errno.h>
     76    1.2    itojun #include <sys/protosw.h>
     77    1.2    itojun #include <sys/socket.h>
     78    1.2    itojun #include <sys/socketvar.h>
     79    1.2    itojun #include <sys/systm.h>
     80    1.2    itojun #include <sys/proc.h>
     81   1.98      elad #include <sys/kauth.h>
     82    1.2    itojun 
     83    1.2    itojun #include <net/if.h>
     84    1.2    itojun #include <net/route.h>
     85   1.15   darrenr #ifdef PFIL_HOOKS
     86   1.15   darrenr #include <net/pfil.h>
     87   1.15   darrenr #endif
     88    1.2    itojun 
     89    1.2    itojun #include <netinet/in.h>
     90    1.2    itojun #include <netinet/in_var.h>
     91   1.14    itojun #include <netinet/ip6.h>
     92   1.14    itojun #include <netinet/icmp6.h>
     93   1.90      yamt #include <netinet/in_offload.h>
     94  1.105      yamt #include <netinet6/in6_offload.h>
     95   1.10    itojun #include <netinet6/ip6_var.h>
     96    1.2    itojun #include <netinet6/in6_pcb.h>
     97    1.2    itojun #include <netinet6/nd6.h>
     98   1.78    itojun #include <netinet6/ip6protosw.h>
     99   1.94    rpaulo #include <netinet6/scope6_var.h>
    100    1.2    itojun 
    101    1.2    itojun #ifdef IPSEC
    102    1.2    itojun #include <netinet6/ipsec.h>
    103    1.2    itojun #include <netkey/key.h>
    104    1.2    itojun #endif /* IPSEC */
    105    1.2    itojun 
    106  1.114  degroote #ifdef FAST_IPSEC
    107  1.114  degroote #include <netipsec/ipsec.h>
    108  1.114  degroote #include <netipsec/ipsec6.h>
    109  1.114  degroote #include <netipsec/key.h>
    110  1.114  degroote #include <netipsec/xform.h>
    111  1.114  degroote #endif
    112  1.114  degroote 
    113  1.114  degroote 
    114    1.9    itojun #include <net/net_osdep.h>
    115    1.9    itojun 
    116   1.27   thorpej #ifdef PFIL_HOOKS
    117   1.27   thorpej extern struct pfil_head inet6_pfil_hook;	/* XXX */
    118   1.27   thorpej #endif
    119   1.27   thorpej 
    120    1.2    itojun struct ip6_exthdrs {	/* per-packet mbuf pointers for the IPv6 header and the extension headers built in ip6_output(); zeroed first, so NULL means "absent" */
    121    1.2    itojun 	struct mbuf *ip6e_ip6;	/* mbuf holding the IPv6 header after ip6_splithdr() */
    122    1.2    itojun 	struct mbuf *ip6e_hbh;	/* Hop-by-Hop options header */
    123    1.2    itojun 	struct mbuf *ip6e_dest1;	/* Destination options header (1st part) */
    124    1.2    itojun 	struct mbuf *ip6e_rthdr;	/* Routing header */
    125    1.2    itojun 	struct mbuf *ip6e_dest2;	/* Destination options header (2nd part) */
    126    1.2    itojun };
    127    1.2    itojun 
    128  1.122    dyoung static int ip6_pcbopt(int, u_char *, int, struct ip6_pktopts **,	/* prototypes of static (file-local) helpers follow */
    129  1.122    dyoung 	int, int);
    130  1.122    dyoung static int ip6_getpcbopt(struct ip6_pktopts *, int, struct mbuf **);
    131  1.122    dyoung static int ip6_setpktopt(int, u_char *, int, struct ip6_pktopts *, int,
    132  1.122    dyoung 	int, int, int);
    133  1.122    dyoung static int ip6_setmoptions(int, struct ip6_moptions **, struct mbuf *);
    134  1.122    dyoung static int ip6_getmoptions(int, struct ip6_moptions *, struct mbuf **);
    135  1.122    dyoung static int ip6_copyexthdr(struct mbuf **, void *, int);	/* used by MAKE_EXTHDR in ip6_output(); a nonzero return is treated as an error */
    136  1.122    dyoung static int ip6_insertfraghdr(struct mbuf *, struct mbuf *, int,
    137  1.122    dyoung 	struct ip6_frag **);
    138  1.122    dyoung static int ip6_insert_jumboopt(struct ip6_exthdrs *, u_int32_t);	/* called by ip6_output() when plen > IPV6_MAXPACKET */
    139  1.122    dyoung static int ip6_splithdr(struct mbuf *, struct ip6_exthdrs *);	/* on success ip6_output() continues with exthdrs->ip6e_ip6 as the head mbuf */
    140  1.118    dyoung static int ip6_getpmtu(struct route *, struct route *, struct ifnet *,
    141  1.115    dyoung     const struct in6_addr *, u_long *, int *);
    142  1.122    dyoung static int copypktopts(struct ip6_pktopts *, struct ip6_pktopts *, int);
    143   1.97    rpaulo 
    144   1.97    rpaulo #ifdef RFC2292
    145  1.122    dyoung static int ip6_pcbopts(struct ip6_pktopts **, struct mbuf *,
    146  1.122    dyoung 	struct socket *);
    147   1.97    rpaulo #endif /* RFC2292 */
    147   1.97    rpaulo #endif
    148    1.2    itojun 
    149   1.90      yamt #define	IN6_NEED_CHECKSUM(ifp, csum_flags) /* true if any of the three conditions below holds; the whole test is hinted as likely true */ \
    150   1.90      yamt 	(__predict_true(((ifp)->if_flags & IFF_LOOPBACK) == 0 || /* ifp is not a loopback interface, or */ \
    151   1.90      yamt 	(((csum_flags) & M_CSUM_UDPv6) != 0 && udp_do_loopback_cksum) || /* UDPv6 flag set and udp_do_loopback_cksum is nonzero, or */ \
    152   1.90      yamt 	(((csum_flags) & M_CSUM_TCPv6) != 0 && tcp_do_loopback_cksum))) /* TCPv6 flag set and tcp_do_loopback_cksum is nonzero */
    153   1.90      yamt 
    154    1.2    itojun /*
    155    1.2    itojun  * IP6 output. The packet in mbuf chain m contains a skeletal IP6
    156    1.2    itojun  * header (with pri, len, nxt, hlim, src, dst).
    157    1.2    itojun  * This function may modify ver and hlim only.
    158    1.2    itojun  * The mbuf chain containing the packet will be freed.
    159    1.2    itojun  * The mbuf opt, if present, will not be freed.
    160   1.52    itojun  *
    161   1.52    itojun  * type of "mtu": rt_rmx.rmx_mtu is u_long, ifnet.ifr_mtu is int, and
    162   1.52    itojun  * nd_ifinfo.linkmtu is u_int32_t.  so we use u_long to hold largest one,
    163   1.52    itojun  * which is rt_rmx.rmx_mtu.
    164    1.2    itojun  */
    165    1.2    itojun int
    166  1.103  christos ip6_output(
    167  1.103  christos     struct mbuf *m0,
    168  1.103  christos     struct ip6_pktopts *opt,
    169  1.118    dyoung     struct route *ro,
    170  1.103  christos     int flags,
    171  1.103  christos     struct ip6_moptions *im6o,
    172  1.104  christos     struct socket *so,
    173  1.103  christos     struct ifnet **ifpp		/* XXX: just for statistics */
    174  1.103  christos )
    175    1.2    itojun {
    176    1.2    itojun 	struct ip6_hdr *ip6, *mhip6;
    177   1.19    itojun 	struct ifnet *ifp, *origifp;
    178    1.2    itojun 	struct mbuf *m = m0;
    179    1.2    itojun 	int hlen, tlen, len, off;
    180  1.116   thorpej 	bool tso;
    181  1.118    dyoung 	struct route ip6route;
    182   1.94    rpaulo 	struct rtentry *rt = NULL;
    183  1.118    dyoung 	const struct sockaddr_in6 *dst = NULL;
    184  1.118    dyoung 	struct sockaddr_in6 src_sa, dst_sa;
    185    1.2    itojun 	int error = 0;
    186   1.94    rpaulo 	struct in6_ifaddr *ia = NULL;
    187    1.2    itojun 	u_long mtu;
    188   1.78    itojun 	int alwaysfrag, dontfrag;
    189    1.2    itojun 	u_int32_t optlen = 0, plen = 0, unfragpartlen = 0;
    190    1.2    itojun 	struct ip6_exthdrs exthdrs;
    191   1.94    rpaulo 	struct in6_addr finaldst, src0, dst0;
    192   1.94    rpaulo 	u_int32_t zone;
    193  1.118    dyoung 	struct route *ro_pmtu = NULL;
    194    1.2    itojun 	int hdrsplit = 0;
    195    1.2    itojun 	int needipsec = 0;
    196    1.2    itojun #ifdef IPSEC
    197    1.2    itojun 	int needipsectun = 0;
    198    1.2    itojun 	struct secpolicy *sp = NULL;
    199    1.2    itojun 
    200    1.2    itojun 	ip6 = mtod(m, struct ip6_hdr *);
    201    1.2    itojun #endif /* IPSEC */
    202  1.114  degroote #ifdef FAST_IPSEC
    203  1.114  degroote 	struct secpolicy *sp = NULL;
    204  1.114  degroote 	int s;
    205  1.114  degroote #endif
    206  1.114  degroote 
    207  1.124    dyoung 	memset(&ip6route, 0, sizeof(ip6route));
    208    1.2    itojun 
    209  1.100      tron #ifdef  DIAGNOSTIC
    210  1.100      tron 	if ((m->m_flags & M_PKTHDR) == 0)
    211  1.100      tron 		panic("ip6_output: no HDR");
    212  1.100      tron 
    213  1.100      tron 	if ((m->m_pkthdr.csum_flags &
    214  1.100      tron 	    (M_CSUM_TCPv4|M_CSUM_UDPv4|M_CSUM_TSOv4)) != 0) {
    215  1.100      tron 		panic("ip6_output: IPv4 checksum offload flags: %d",
    216  1.100      tron 		    m->m_pkthdr.csum_flags);
    217  1.100      tron 	}
    218  1.100      tron 
    219  1.100      tron 	if ((m->m_pkthdr.csum_flags & (M_CSUM_TCPv6|M_CSUM_UDPv6)) ==
    220  1.100      tron 	    (M_CSUM_TCPv6|M_CSUM_UDPv6)) {
    221  1.100      tron 		panic("ip6_output: conflicting checksum offload flags: %d",
    222  1.100      tron 		    m->m_pkthdr.csum_flags);
    223  1.100      tron 	}
    224  1.100      tron #endif
    225  1.100      tron 
    226   1.89      yamt 	M_CSUM_DATA_IPv6_HL_SET(m->m_pkthdr.csum_data, sizeof(struct ip6_hdr));
    227   1.89      yamt 
    228   1.22    itojun #define MAKE_EXTHDR(hp, mp)						\
    229   1.22    itojun     do {								\
    230    1.2    itojun 	if (hp) {							\
    231    1.2    itojun 		struct ip6_ext *eh = (struct ip6_ext *)(hp);		\
    232  1.117  christos 		error = ip6_copyexthdr((mp), (void *)(hp), 		\
    233   1.49    itojun 		    ((eh)->ip6e_len + 1) << 3);				\
    234    1.2    itojun 		if (error)						\
    235    1.2    itojun 			goto freehdrs;					\
    236    1.2    itojun 	}								\
    237   1.60     perry     } while (/*CONSTCOND*/ 0)
    238   1.51    itojun 
    239    1.2    itojun 	bzero(&exthdrs, sizeof(exthdrs));
    240    1.2    itojun 	if (opt) {
    241    1.2    itojun 		/* Hop-by-Hop options header */
    242    1.2    itojun 		MAKE_EXTHDR(opt->ip6po_hbh, &exthdrs.ip6e_hbh);
    243    1.2    itojun 		/* Destination options header(1st part) */
    244    1.2    itojun 		MAKE_EXTHDR(opt->ip6po_dest1, &exthdrs.ip6e_dest1);
    245    1.2    itojun 		/* Routing header */
    246    1.2    itojun 		MAKE_EXTHDR(opt->ip6po_rthdr, &exthdrs.ip6e_rthdr);
    247    1.2    itojun 		/* Destination options header(2nd part) */
    248    1.2    itojun 		MAKE_EXTHDR(opt->ip6po_dest2, &exthdrs.ip6e_dest2);
    249    1.2    itojun 	}
    250    1.2    itojun 
    251    1.2    itojun #ifdef IPSEC
    252   1.76    itojun 	if ((flags & IPV6_FORWARDING) != 0) {
    253   1.76    itojun 		needipsec = 0;
    254   1.76    itojun 		goto skippolicycheck;
    255   1.76    itojun 	}
    256   1.76    itojun 
    257    1.2    itojun 	/* get a security policy for this packet */
    258    1.2    itojun 	if (so == NULL)
    259   1.13    itojun 		sp = ipsec6_getpolicybyaddr(m, IPSEC_DIR_OUTBOUND, 0, &error);
    260   1.81   thorpej 	else {
    261   1.81   thorpej 		if (IPSEC_PCB_SKIP_IPSEC(sotoinpcb_hdr(so)->inph_sp,
    262   1.81   thorpej 					 IPSEC_DIR_OUTBOUND)) {
    263   1.81   thorpej 			needipsec = 0;
    264   1.81   thorpej 			goto skippolicycheck;
    265   1.81   thorpej 		}
    266   1.13    itojun 		sp = ipsec6_getpolicybysock(m, IPSEC_DIR_OUTBOUND, so, &error);
    267   1.81   thorpej 	}
    268    1.2    itojun 
    269    1.2    itojun 	if (sp == NULL) {
    270    1.2    itojun 		ipsec6stat.out_inval++;
    271   1.23    itojun 		goto freehdrs;
    272    1.2    itojun 	}
    273    1.2    itojun 
    274    1.2    itojun 	error = 0;
    275    1.2    itojun 
    276    1.2    itojun 	/* check policy */
    277    1.2    itojun 	switch (sp->policy) {
    278    1.2    itojun 	case IPSEC_POLICY_DISCARD:
    279    1.2    itojun 		/*
    280    1.2    itojun 		 * This packet is just discarded.
    281    1.2    itojun 		 */
    282    1.2    itojun 		ipsec6stat.out_polvio++;
    283   1.23    itojun 		goto freehdrs;
    284    1.2    itojun 
    285    1.2    itojun 	case IPSEC_POLICY_BYPASS:
    286    1.2    itojun 	case IPSEC_POLICY_NONE:
    287    1.2    itojun 		/* no need to do IPsec. */
    288    1.2    itojun 		needipsec = 0;
    289    1.2    itojun 		break;
    290   1.51    itojun 
    291    1.2    itojun 	case IPSEC_POLICY_IPSEC:
    292    1.2    itojun 		if (sp->req == NULL) {
    293    1.2    itojun 			/* XXX should be panic ? */
    294    1.2    itojun 			printf("ip6_output: No IPsec request specified.\n");
    295    1.2    itojun 			error = EINVAL;
    296   1.23    itojun 			goto freehdrs;
    297    1.2    itojun 		}
    298    1.2    itojun 		needipsec = 1;
    299    1.2    itojun 		break;
    300    1.2    itojun 
    301    1.2    itojun 	case IPSEC_POLICY_ENTRUST:
    302    1.2    itojun 	default:
    303    1.2    itojun 		printf("ip6_output: Invalid policy found. %d\n", sp->policy);
    304    1.2    itojun 	}
    305   1.76    itojun 
    306   1.76    itojun   skippolicycheck:;
    307    1.2    itojun #endif /* IPSEC */
    308    1.2    itojun 
    309    1.2    itojun 	/*
    310    1.2    itojun 	 * Calculate the total length of the extension header chain.
    311    1.2    itojun 	 * Keep the length of the unfragmentable part for fragmentation.
    312    1.2    itojun 	 */
    313    1.9    itojun 	optlen = 0;
    314    1.2    itojun 	if (exthdrs.ip6e_hbh) optlen += exthdrs.ip6e_hbh->m_len;
    315    1.2    itojun 	if (exthdrs.ip6e_dest1) optlen += exthdrs.ip6e_dest1->m_len;
    316    1.2    itojun 	if (exthdrs.ip6e_rthdr) optlen += exthdrs.ip6e_rthdr->m_len;
    317    1.9    itojun 	unfragpartlen = optlen + sizeof(struct ip6_hdr);
    318    1.2    itojun 	/* NOTE: we don't add AH/ESP length here. do that later. */
    319    1.2    itojun 	if (exthdrs.ip6e_dest2) optlen += exthdrs.ip6e_dest2->m_len;
    320    1.2    itojun 
    321  1.114  degroote #ifdef FAST_IPSEC
    322  1.114  degroote 	/* Check the security policy (SP) for the packet */
    323  1.114  degroote 
    324  1.114  degroote 	/* XXX For the moment, we don't support packets with extension headers */
    325  1.114  degroote 	if (optlen !=0)
    326  1.114  degroote 		goto freehdrs;
    327  1.114  degroote 
    328  1.114  degroote 	sp = ipsec6_check_policy(m,so,flags,&needipsec,&error);
    329  1.114  degroote 	if (error != 0) {
    330  1.114  degroote 		/*
    331  1.114  degroote 		 * Hack: -EINVAL is used to signal that a packet
    332  1.114  degroote 		 * should be silently discarded.  This is typically
    333  1.114  degroote 		 * because we asked key management for an SA and
    334  1.114  degroote 		 * it was delayed (e.g. kicked up to IKE).
    335  1.114  degroote 		 */
    336  1.114  degroote 	if (error == -EINVAL)
    337  1.114  degroote 		error = 0;
    338  1.114  degroote 	goto freehdrs;
    339  1.114  degroote     }
    340  1.114  degroote #endif /* FAST_IPSEC */
    341  1.114  degroote 
    342  1.114  degroote 
    343  1.114  degroote 	if (needipsec &&
    344  1.114  degroote 	    (m->m_pkthdr.csum_flags & (M_CSUM_UDPv6|M_CSUM_TCPv6)) != 0) {
    345  1.114  degroote 		in6_delayed_cksum(m);
    346  1.114  degroote 		m->m_pkthdr.csum_flags &= ~(M_CSUM_UDPv6|M_CSUM_TCPv6);
    347  1.114  degroote 	}
    348  1.114  degroote 
    349  1.114  degroote 
    350    1.2    itojun 	/*
    351    1.2    itojun 	 * If we need IPsec, or there is at least one extension header,
    352    1.2    itojun 	 * separate IP6 header from the payload.
    353    1.2    itojun 	 */
    354    1.2    itojun 	if ((needipsec || optlen) && !hdrsplit) {
    355    1.2    itojun 		if ((error = ip6_splithdr(m, &exthdrs)) != 0) {
    356    1.2    itojun 			m = NULL;
    357    1.2    itojun 			goto freehdrs;
    358    1.2    itojun 		}
    359    1.2    itojun 		m = exthdrs.ip6e_ip6;
    360    1.2    itojun 		hdrsplit++;
    361    1.2    itojun 	}
    362    1.2    itojun 
    363    1.2    itojun 	/* adjust pointer */
    364    1.2    itojun 	ip6 = mtod(m, struct ip6_hdr *);
    365    1.2    itojun 
    366    1.2    itojun 	/* adjust mbuf packet header length */
    367    1.2    itojun 	m->m_pkthdr.len += optlen;
    368    1.2    itojun 	plen = m->m_pkthdr.len - sizeof(*ip6);
    369    1.2    itojun 
    370    1.2    itojun 	/* If this is a jumbo payload, insert a jumbo payload option. */
    371    1.2    itojun 	if (plen > IPV6_MAXPACKET) {
    372    1.2    itojun 		if (!hdrsplit) {
    373    1.2    itojun 			if ((error = ip6_splithdr(m, &exthdrs)) != 0) {
    374    1.2    itojun 				m = NULL;
    375    1.2    itojun 				goto freehdrs;
    376    1.2    itojun 			}
    377    1.2    itojun 			m = exthdrs.ip6e_ip6;
    378    1.2    itojun 			hdrsplit++;
    379    1.2    itojun 		}
    380    1.2    itojun 		/* adjust pointer */
    381    1.2    itojun 		ip6 = mtod(m, struct ip6_hdr *);
    382    1.2    itojun 		if ((error = ip6_insert_jumboopt(&exthdrs, plen)) != 0)
    383    1.2    itojun 			goto freehdrs;
    384   1.89      yamt 		optlen += 8; /* XXX JUMBOOPTLEN */
    385    1.2    itojun 		ip6->ip6_plen = 0;
    386    1.2    itojun 	} else
    387    1.2    itojun 		ip6->ip6_plen = htons(plen);
    388    1.2    itojun 
    389    1.2    itojun 	/*
    390    1.2    itojun 	 * Concatenate headers and fill in next header fields.
    391    1.2    itojun 	 * Here we have, on "m"
    392    1.9    itojun 	 *	IPv6 payload
    393    1.2    itojun 	 * and we insert headers accordingly.  Finally, we should be getting:
    394    1.2    itojun 	 *	IPv6 hbh dest1 rthdr ah* [esp* dest2 payload]
    395    1.9    itojun 	 *
    396    1.9    itojun 	 * during the header composing process, "m" points to IPv6 header.
    397    1.9    itojun 	 * "mprev" points to an extension header prior to esp.
    398    1.2    itojun 	 */
    399    1.2    itojun 	{
    400    1.2    itojun 		u_char *nexthdrp = &ip6->ip6_nxt;
    401    1.2    itojun 		struct mbuf *mprev = m;
    402    1.2    itojun 
    403    1.2    itojun 		/*
    404    1.2    itojun 		 * we treat dest2 specially.  this makes IPsec processing
    405   1.78    itojun 		 * much easier.  the goal here is to make mprev point the
    406   1.78    itojun 		 * mbuf prior to dest2.
    407    1.9    itojun 		 *
    408    1.9    itojun 		 * result: IPv6 dest2 payload
    409    1.9    itojun 		 * m and mprev will point to IPv6 header.
    410    1.2    itojun 		 */
    411    1.2    itojun 		if (exthdrs.ip6e_dest2) {
    412    1.2    itojun 			if (!hdrsplit)
    413    1.2    itojun 				panic("assumption failed: hdr not split");
    414    1.9    itojun 			exthdrs.ip6e_dest2->m_next = m->m_next;
    415    1.9    itojun 			m->m_next = exthdrs.ip6e_dest2;
    416    1.2    itojun 			*mtod(exthdrs.ip6e_dest2, u_char *) = ip6->ip6_nxt;
    417    1.2    itojun 			ip6->ip6_nxt = IPPROTO_DSTOPTS;
    418    1.2    itojun 		}
    419    1.2    itojun 
    420   1.22    itojun #define MAKE_CHAIN(m, mp, p, i)\
    421   1.22    itojun     do {\
    422    1.2    itojun 	if (m) {\
    423    1.2    itojun 		if (!hdrsplit) \
    424    1.2    itojun 			panic("assumption failed: hdr not split"); \
    425    1.2    itojun 		*mtod((m), u_char *) = *(p);\
    426    1.2    itojun 		*(p) = (i);\
    427    1.2    itojun 		p = mtod((m), u_char *);\
    428    1.2    itojun 		(m)->m_next = (mp)->m_next;\
    429    1.2    itojun 		(mp)->m_next = (m);\
    430    1.2    itojun 		(mp) = (m);\
    431    1.2    itojun 	}\
    432   1.60     perry     } while (/*CONSTCOND*/ 0)
    433    1.9    itojun 		/*
    434    1.9    itojun 		 * result: IPv6 hbh dest1 rthdr dest2 payload
    435    1.9    itojun 		 * m will point to IPv6 header.  mprev will point to the
    436    1.9    itojun 		 * extension header prior to dest2 (rthdr in the above case).
    437    1.9    itojun 		 */
    438   1.49    itojun 		MAKE_CHAIN(exthdrs.ip6e_hbh, mprev, nexthdrp, IPPROTO_HOPOPTS);
    439   1.49    itojun 		MAKE_CHAIN(exthdrs.ip6e_dest1, mprev, nexthdrp,
    440   1.49    itojun 		    IPPROTO_DSTOPTS);
    441   1.49    itojun 		MAKE_CHAIN(exthdrs.ip6e_rthdr, mprev, nexthdrp,
    442   1.49    itojun 		    IPPROTO_ROUTING);
    443    1.2    itojun 
    444   1.89      yamt 		M_CSUM_DATA_IPv6_HL_SET(m->m_pkthdr.csum_data,
    445   1.89      yamt 		    sizeof(struct ip6_hdr) + optlen);
    446   1.89      yamt 
    447    1.2    itojun #ifdef IPSEC
    448    1.2    itojun 		if (!needipsec)
    449    1.2    itojun 			goto skip_ipsec2;
    450    1.2    itojun 
    451    1.2    itojun 		/*
    452    1.2    itojun 		 * pointers after IPsec headers are not valid any more.
    453    1.2    itojun 		 * other pointers need a great care too.
    454    1.2    itojun 		 * (IPsec routines should not mangle mbufs prior to AH/ESP)
    455    1.2    itojun 		 */
    456    1.2    itojun 		exthdrs.ip6e_dest2 = NULL;
    457    1.2    itojun 
    458    1.2    itojun 	    {
    459    1.2    itojun 		struct ip6_rthdr *rh = NULL;
    460    1.2    itojun 		int segleft_org = 0;
    461    1.2    itojun 		struct ipsec_output_state state;
    462    1.2    itojun 
    463    1.2    itojun 		if (exthdrs.ip6e_rthdr) {
    464    1.2    itojun 			rh = mtod(exthdrs.ip6e_rthdr, struct ip6_rthdr *);
    465    1.2    itojun 			segleft_org = rh->ip6r_segleft;
    466    1.2    itojun 			rh->ip6r_segleft = 0;
    467    1.2    itojun 		}
    468    1.2    itojun 
    469    1.2    itojun 		bzero(&state, sizeof(state));
    470    1.2    itojun 		state.m = m;
    471    1.2    itojun 		error = ipsec6_output_trans(&state, nexthdrp, mprev, sp, flags,
    472   1.78    itojun 		    &needipsectun);
    473    1.2    itojun 		m = state.m;
    474    1.2    itojun 		if (error) {
    475  1.115    dyoung 			rh = mtod(exthdrs.ip6e_rthdr, struct ip6_rthdr *);
    476    1.2    itojun 			/* mbuf is already reclaimed in ipsec6_output_trans. */
    477    1.2    itojun 			m = NULL;
    478    1.2    itojun 			switch (error) {
    479    1.2    itojun 			case EHOSTUNREACH:
    480    1.2    itojun 			case ENETUNREACH:
    481    1.2    itojun 			case EMSGSIZE:
    482    1.2    itojun 			case ENOBUFS:
    483    1.2    itojun 			case ENOMEM:
    484    1.2    itojun 				break;
    485    1.2    itojun 			default:
    486    1.2    itojun 				printf("ip6_output (ipsec): error code %d\n", error);
    487   1.48    itojun 				/* FALLTHROUGH */
    488    1.2    itojun 			case ENOENT:
    489    1.2    itojun 				/* don't show these error codes to the user */
    490    1.2    itojun 				error = 0;
    491    1.2    itojun 				break;
    492    1.2    itojun 			}
    493    1.2    itojun 			goto bad;
    494    1.2    itojun 		}
    495    1.2    itojun 		if (exthdrs.ip6e_rthdr) {
    496    1.2    itojun 			/* ah6_output doesn't modify mbuf chain */
    497    1.2    itojun 			rh->ip6r_segleft = segleft_org;
    498    1.2    itojun 		}
    499    1.2    itojun 	    }
    500    1.2    itojun skip_ipsec2:;
    501    1.2    itojun #endif
    502    1.2    itojun 	}
    503    1.2    itojun 
    504    1.2    itojun 	/*
    505    1.2    itojun 	 * If there is a routing header, replace destination address field
    506    1.2    itojun 	 * with the first hop of the routing header.
    507    1.2    itojun 	 */
    508    1.2    itojun 	if (exthdrs.ip6e_rthdr) {
    509   1.49    itojun 		struct ip6_rthdr *rh;
    510    1.2    itojun 		struct ip6_rthdr0 *rh0;
    511   1.61    itojun 		struct in6_addr *addr;
    512   1.94    rpaulo 		struct sockaddr_in6 sa;
    513    1.2    itojun 
    514   1.49    itojun 		rh = (struct ip6_rthdr *)(mtod(exthdrs.ip6e_rthdr,
    515   1.49    itojun 		    struct ip6_rthdr *));
    516    1.2    itojun 		finaldst = ip6->ip6_dst;
    517   1.31    itojun 		switch (rh->ip6r_type) {
    518    1.2    itojun 		case IPV6_RTHDR_TYPE_0:
    519    1.2    itojun 			 rh0 = (struct ip6_rthdr0 *)rh;
    520   1.61    itojun 			 addr = (struct in6_addr *)(rh0 + 1);
    521   1.94    rpaulo 
    522   1.94    rpaulo 			 /*
    523   1.94    rpaulo 			  * construct a sockaddr_in6 form of
    524   1.94    rpaulo 			  * the first hop.
    525   1.94    rpaulo 			  *
    526   1.94    rpaulo 			  * XXX: we may not have enough
    527   1.94    rpaulo 			  * information about its scope zone;
    528   1.94    rpaulo 			  * there is no standard API to pass
    529   1.94    rpaulo 			  * the information from the
    530   1.94    rpaulo 			  * application.
    531   1.94    rpaulo 			  */
    532  1.123    dyoung 			 sockaddr_in6_init(&sa, addr, 0, 0, 0);
    533   1.94    rpaulo 			 if ((error = sa6_embedscope(&sa,
    534   1.94    rpaulo 			     ip6_use_defzone)) != 0) {
    535   1.94    rpaulo 				 goto bad;
    536   1.94    rpaulo 			 }
    537   1.94    rpaulo 			 ip6->ip6_dst = sa.sin6_addr;
    538   1.92  christos 			 (void)memmove(&addr[0], &addr[1],
    539   1.94    rpaulo 			     sizeof(struct in6_addr) *
    540   1.94    rpaulo 			     (rh0->ip6r0_segleft - 1));
    541   1.61    itojun 			 addr[rh0->ip6r0_segleft - 1] = finaldst;
    542   1.94    rpaulo 			 /* XXX */
    543   1.94    rpaulo 			 in6_clearscope(addr + rh0->ip6r0_segleft - 1);
    544    1.2    itojun 			 break;
    545    1.2    itojun 		default:	/* is it possible? */
    546    1.2    itojun 			 error = EINVAL;
    547    1.2    itojun 			 goto bad;
    548    1.2    itojun 		}
    549    1.2    itojun 	}
    550    1.2    itojun 
    551    1.2    itojun 	/* Source address validation */
    552    1.2    itojun 	if (IN6_IS_ADDR_UNSPECIFIED(&ip6->ip6_src) &&
    553   1.54    itojun 	    (flags & IPV6_UNSPECSRC) == 0) {
    554    1.2    itojun 		error = EOPNOTSUPP;
    555    1.2    itojun 		ip6stat.ip6s_badscope++;
    556    1.2    itojun 		goto bad;
    557    1.2    itojun 	}
    558    1.2    itojun 	if (IN6_IS_ADDR_MULTICAST(&ip6->ip6_src)) {
    559    1.2    itojun 		error = EOPNOTSUPP;
    560    1.2    itojun 		ip6stat.ip6s_badscope++;
    561    1.2    itojun 		goto bad;
    562    1.2    itojun 	}
    563    1.2    itojun 
    564    1.2    itojun 	ip6stat.ip6s_localout++;
    565    1.2    itojun 
    566    1.2    itojun 	/*
    567    1.2    itojun 	 * Route packet.
    568    1.2    itojun 	 */
    569   1.78    itojun 	/* initialize cached route */
    570  1.113    dyoung 	if (ro == NULL) {
    571    1.2    itojun 		ro = &ip6route;
    572    1.2    itojun 	}
    573    1.2    itojun 	ro_pmtu = ro;
    574    1.2    itojun 	if (opt && opt->ip6po_rthdr)
    575    1.2    itojun 		ro = &opt->ip6po_route;
    576   1.94    rpaulo 
    577   1.94    rpaulo  	/*
    578   1.94    rpaulo 	 * if specified, try to fill in the traffic class field.
    579   1.94    rpaulo 	 * do not override if a non-zero value is already set.
    580   1.94    rpaulo 	 * we check the diffserv field and the ecn field separately.
    581   1.94    rpaulo 	 */
    582   1.94    rpaulo 	if (opt && opt->ip6po_tclass >= 0) {
    583   1.94    rpaulo 		int mask = 0;
    584   1.94    rpaulo 
    585   1.94    rpaulo 		if ((ip6->ip6_flow & htonl(0xfc << 20)) == 0)
    586   1.94    rpaulo 			mask |= 0xfc;
    587   1.94    rpaulo 		if ((ip6->ip6_flow & htonl(0x03 << 20)) == 0)
    588   1.94    rpaulo 			mask |= 0x03;
    589   1.94    rpaulo 		if (mask != 0)
    590   1.94    rpaulo 			ip6->ip6_flow |= htonl((opt->ip6po_tclass & mask) << 20);
    591    1.2    itojun 	}
    592   1.94    rpaulo 
    593   1.94    rpaulo 	/* fill in or override the hop limit field, if necessary. */
    594   1.94    rpaulo 	if (opt && opt->ip6po_hlim != -1)
    595   1.94    rpaulo 		ip6->ip6_hlim = opt->ip6po_hlim & 0xff;
    596   1.94    rpaulo 	else if (IN6_IS_ADDR_MULTICAST(&ip6->ip6_dst)) {
    597   1.94    rpaulo 		if (im6o != NULL)
    598   1.94    rpaulo 			ip6->ip6_hlim = im6o->im6o_multicast_hlim;
    599   1.94    rpaulo 		else
    600   1.94    rpaulo 			ip6->ip6_hlim = ip6_defmcasthlim;
    601    1.2    itojun 	}
    602   1.94    rpaulo 
    603    1.2    itojun #ifdef IPSEC
    604    1.2    itojun 	if (needipsec && needipsectun) {
    605    1.2    itojun 		struct ipsec_output_state state;
    606    1.2    itojun 
    607    1.2    itojun 		/*
    608    1.2    itojun 		 * All the extension headers will become inaccessible
    609    1.2    itojun 		 * (since they can be encrypted).
    610    1.2    itojun 		 * Don't panic, we need no more updates to extension headers
    611    1.2    itojun 		 * on inner IPv6 packet (since they are now encapsulated).
    612    1.2    itojun 		 *
    613    1.2    itojun 		 * IPv6 [ESP|AH] IPv6 [extension headers] payload
    614    1.2    itojun 		 */
    615    1.2    itojun 		bzero(&exthdrs, sizeof(exthdrs));
    616    1.2    itojun 		exthdrs.ip6e_ip6 = m;
    617    1.2    itojun 
    618    1.2    itojun 		bzero(&state, sizeof(state));
    619    1.2    itojun 		state.m = m;
    620  1.118    dyoung 		state.ro = ro;
    621  1.118    dyoung 		state.dst = rtcache_getdst(ro);
    622    1.2    itojun 
    623    1.2    itojun 		error = ipsec6_output_tunnel(&state, sp, flags);
    624    1.2    itojun 
    625    1.2    itojun 		m = state.m;
    626  1.118    dyoung 		ro_pmtu = ro = state.ro;
    627  1.118    dyoung 		dst = satocsin6(state.dst);
    628    1.2    itojun 		if (error) {
    629    1.2    itojun 			/* mbuf is already reclaimed in ipsec6_output_tunnel. */
    630    1.2    itojun 			m0 = m = NULL;
    631    1.2    itojun 			m = NULL;
    632    1.2    itojun 			switch (error) {
    633    1.2    itojun 			case EHOSTUNREACH:
    634    1.2    itojun 			case ENETUNREACH:
    635    1.2    itojun 			case EMSGSIZE:
    636    1.2    itojun 			case ENOBUFS:
    637    1.2    itojun 			case ENOMEM:
    638    1.2    itojun 				break;
    639    1.2    itojun 			default:
    640    1.2    itojun 				printf("ip6_output (ipsec): error code %d\n", error);
    641   1.48    itojun 				/* FALLTHROUGH */
    642    1.2    itojun 			case ENOENT:
    643    1.2    itojun 				/* don't show these error codes to the user */
    644    1.2    itojun 				error = 0;
    645    1.2    itojun 				break;
    646    1.2    itojun 			}
    647    1.2    itojun 			goto bad;
    648    1.2    itojun 		}
    649    1.2    itojun 
    650    1.2    itojun 		exthdrs.ip6e_ip6 = m;
    651    1.2    itojun 	}
    652   1.40    itojun #endif /* IPSEC */
    653  1.114  degroote #ifdef FAST_IPSEC
    654  1.114  degroote 	if (needipsec) {
    655  1.114  degroote 		s = splsoftnet();
    656  1.114  degroote 		error = ipsec6_process_packet(m,sp->req);
    657  1.114  degroote 
    658  1.114  degroote 		/*
    659  1.114  degroote 		 * Preserve KAME behaviour: ENOENT can be returned
    660  1.114  degroote 		 * when an SA acquire is in progress.  Don't propagate
    661  1.114  degroote 		 * this to user-level; it confuses applications.
    662  1.114  degroote 		 * XXX this will go away when the SADB is redone.
    663  1.114  degroote 		 */
    664  1.114  degroote 		if (error == ENOENT)
    665  1.114  degroote 			error = 0;
    666  1.114  degroote 		splx(s);
    667  1.114  degroote 		goto done;
    668  1.118    dyoung 	}
    669  1.114  degroote #endif /* FAST_IPSEC */
    670  1.114  degroote 
    671  1.114  degroote 
    672    1.2    itojun 
    673   1.94    rpaulo 	/* adjust pointer */
    674   1.94    rpaulo 	ip6 = mtod(m, struct ip6_hdr *);
    675    1.2    itojun 
    676  1.123    dyoung 	sockaddr_in6_init(&dst_sa, &ip6->ip6_dst, 0, 0, 0);
    677  1.118    dyoung 	if ((error = in6_selectroute(&dst_sa, opt, im6o, ro,
    678  1.115    dyoung 	    &ifp, &rt, 0)) != 0) {
    679   1.94    rpaulo 		if (ifp != NULL)
    680   1.94    rpaulo 			in6_ifstat_inc(ifp, ifs6_out_discard);
    681   1.94    rpaulo 		goto bad;
    682   1.94    rpaulo 	}
    683   1.94    rpaulo 	if (rt == NULL) {
    684   1.94    rpaulo 		/*
    685   1.94    rpaulo 		 * If in6_selectroute() does not return a route entry,
    686   1.94    rpaulo 		 * dst may not have been updated.
    687   1.94    rpaulo 		 */
    688  1.118    dyoung 		rtcache_setdst(ro, sin6tosa(&dst_sa));
    689   1.94    rpaulo 	}
    690    1.2    itojun 
    691   1.94    rpaulo 	/*
    692   1.94    rpaulo 	 * then rt (for unicast) and ifp must be non-NULL valid values.
    693   1.94    rpaulo 	 */
    694   1.94    rpaulo 	if ((flags & IPV6_FORWARDING) == 0) {
    695   1.94    rpaulo 		/* XXX: the FORWARDING flag can be set for mrouting. */
    696    1.9    itojun 		in6_ifstat_inc(ifp, ifs6_out_request);
    697   1.94    rpaulo 	}
    698   1.94    rpaulo 	if (rt != NULL) {
    699   1.94    rpaulo 		ia = (struct in6_ifaddr *)(rt->rt_ifa);
    700   1.94    rpaulo 		rt->rt_use++;
    701   1.94    rpaulo 	}
    702    1.9    itojun 
    703   1.94    rpaulo 	/*
    704   1.94    rpaulo 	 * The outgoing interface must be in the zone of source and
    705   1.94    rpaulo 	 * destination addresses.  We should use ia_ifp to support the
    706   1.94    rpaulo 	 * case of sending packets to an address of our own.
    707   1.94    rpaulo 	 */
    708   1.94    rpaulo 	if (ia != NULL && ia->ia_ifp)
    709   1.94    rpaulo 		origifp = ia->ia_ifp;
    710   1.94    rpaulo 	else
    711   1.94    rpaulo 		origifp = ifp;
    712    1.2    itojun 
    713   1.94    rpaulo 	src0 = ip6->ip6_src;
    714   1.94    rpaulo 	if (in6_setscope(&src0, origifp, &zone))
    715   1.94    rpaulo 		goto badscope;
    716  1.123    dyoung 	sockaddr_in6_init(&src_sa, &ip6->ip6_src, 0, 0, 0);
    717   1.94    rpaulo 	if (sa6_recoverscope(&src_sa) || zone != src_sa.sin6_scope_id)
    718   1.94    rpaulo 		goto badscope;
    719   1.94    rpaulo 
    720   1.94    rpaulo 	dst0 = ip6->ip6_dst;
    721   1.94    rpaulo 	if (in6_setscope(&dst0, origifp, &zone))
    722   1.94    rpaulo 		goto badscope;
    723   1.94    rpaulo 	/* re-initialize to be sure */
    724  1.123    dyoung 	sockaddr_in6_init(&dst_sa, &ip6->ip6_dst, 0, 0, 0);
    725   1.94    rpaulo 	if (sa6_recoverscope(&dst_sa) || zone != dst_sa.sin6_scope_id)
    726   1.94    rpaulo 		goto badscope;
    727   1.94    rpaulo 
    728   1.94    rpaulo 	/* scope check is done. */
    729   1.94    rpaulo 
    730  1.118    dyoung 	if (rt == NULL || IN6_IS_ADDR_MULTICAST(&ip6->ip6_dst)) {
    731  1.118    dyoung 		if (dst == NULL)
    732  1.118    dyoung 			dst = satocsin6(rtcache_getdst(ro));
    733  1.118    dyoung 		KASSERT(dst != NULL);
    734  1.124    dyoung 	} else if (opt && rtcache_getrt(&opt->ip6po_nextroute) != NULL) {
    735  1.118    dyoung 		/*
    736  1.118    dyoung 		 * The nexthop is explicitly specified by the
    737  1.118    dyoung 		 * application.  We assume the next hop is an IPv6
    738  1.118    dyoung 		 * address.
    739  1.118    dyoung 		 */
    740  1.118    dyoung 		dst = (struct sockaddr_in6 *)opt->ip6po_nexthop;
    741  1.118    dyoung 	} else if ((rt->rt_flags & RTF_GATEWAY))
    742  1.118    dyoung 		dst = (struct sockaddr_in6 *)rt->rt_gateway;
    743  1.118    dyoung 	else if (dst == NULL)
    744  1.118    dyoung 		dst = satocsin6(rtcache_getdst(ro));
    745    1.2    itojun 
    746   1.94    rpaulo 	/*
    747   1.94    rpaulo 	 * XXXXXX: original code follows:
    748   1.94    rpaulo 	 */
    749   1.94    rpaulo 	if (!IN6_IS_ADDR_MULTICAST(&ip6->ip6_dst))
    750   1.94    rpaulo 		m->m_flags &= ~(M_BCAST | M_MCAST);	/* just in case */
    751   1.94    rpaulo 	else {
    752   1.94    rpaulo 		struct	in6_multi *in6m;
    753    1.2    itojun 
    754   1.94    rpaulo 		m->m_flags = (m->m_flags & ~M_BCAST) | M_MCAST;
    755    1.9    itojun 
    756    1.9    itojun 		in6_ifstat_inc(ifp, ifs6_out_mcast);
    757    1.9    itojun 
    758    1.2    itojun 		/*
    759    1.2    itojun 		 * Confirm that the outgoing interface supports multicast.
    760    1.2    itojun 		 */
    761   1.94    rpaulo 		if (!(ifp->if_flags & IFF_MULTICAST)) {
    762    1.2    itojun 			ip6stat.ip6s_noroute++;
    763    1.9    itojun 			in6_ifstat_inc(ifp, ifs6_out_discard);
    764    1.2    itojun 			error = ENETUNREACH;
    765    1.2    itojun 			goto bad;
    766    1.2    itojun 		}
    767   1.94    rpaulo 
    768    1.2    itojun 		IN6_LOOKUP_MULTI(ip6->ip6_dst, ifp, in6m);
    769    1.2    itojun 		if (in6m != NULL &&
    770    1.2    itojun 		   (im6o == NULL || im6o->im6o_multicast_loop)) {
    771    1.2    itojun 			/*
    772    1.2    itojun 			 * If we belong to the destination multicast group
    773    1.2    itojun 			 * on the outgoing interface, and the caller did not
    774    1.2    itojun 			 * forbid loopback, loop back a copy.
    775    1.2    itojun 			 */
    776  1.118    dyoung 			KASSERT(dst != NULL);
    777    1.2    itojun 			ip6_mloopback(ifp, m, dst);
    778    1.2    itojun 		} else {
    779    1.2    itojun 			/*
    780    1.2    itojun 			 * If we are acting as a multicast router, perform
    781    1.2    itojun 			 * multicast forwarding as if the packet had just
    782    1.2    itojun 			 * arrived on the interface to which we are about
    783    1.2    itojun 			 * to send.  The multicast forwarding function
    784    1.2    itojun 			 * recursively calls this function, using the
    785    1.2    itojun 			 * IPV6_FORWARDING flag to prevent infinite recursion.
    786    1.2    itojun 			 *
    787    1.2    itojun 			 * Multicasts that are looped back by ip6_mloopback(),
    788    1.2    itojun 			 * above, will be forwarded by the ip6_input() routine,
    789    1.2    itojun 			 * if necessary.
    790    1.2    itojun 			 */
    791    1.2    itojun 			if (ip6_mrouter && (flags & IPV6_FORWARDING) == 0) {
    792   1.20   thorpej 				if (ip6_mforward(ip6, ifp, m) != 0) {
    793    1.2    itojun 					m_freem(m);
    794    1.2    itojun 					goto done;
    795    1.2    itojun 				}
    796    1.2    itojun 			}
    797    1.2    itojun 		}
    798    1.2    itojun 		/*
    799    1.2    itojun 		 * Multicasts with a hoplimit of zero may be looped back,
    800    1.2    itojun 		 * above, but must not be transmitted on a network.
    801    1.2    itojun 		 * Also, multicasts addressed to the loopback interface
    802    1.2    itojun 		 * are not sent -- the above call to ip6_mloopback() will
    803    1.2    itojun 		 * loop back a copy if this host actually belongs to the
    804    1.2    itojun 		 * destination group on the loopback interface.
    805    1.2    itojun 		 */
    806   1.94    rpaulo 		if (ip6->ip6_hlim == 0 || (ifp->if_flags & IFF_LOOPBACK) ||
    807   1.94    rpaulo 		    IN6_IS_ADDR_MC_INTFACELOCAL(&ip6->ip6_dst)) {
    808    1.2    itojun 			m_freem(m);
    809    1.2    itojun 			goto done;
    810    1.2    itojun 		}
    811    1.2    itojun 	}
    812    1.2    itojun 
    813    1.2    itojun 	/*
    814    1.9    itojun 	 * Fill the outgoing interface to tell the upper layer
    815    1.9    itojun 	 * to increment per-interface statistics.
    816    1.9    itojun 	 */
    817    1.9    itojun 	if (ifpp)
    818    1.9    itojun 		*ifpp = ifp;
    819    1.9    itojun 
    820   1.45    itojun 	/* Determine path MTU. */
    821   1.78    itojun 	if ((error = ip6_getpmtu(ro_pmtu, ro, ifp, &finaldst, &mtu,
    822   1.78    itojun 	    &alwaysfrag)) != 0)
    823   1.45    itojun 		goto bad;
    824   1.85    itojun #ifdef IPSEC
    825   1.85    itojun 	if (needipsectun)
    826   1.85    itojun 		mtu = IPV6_MMTU;
    827   1.85    itojun #endif
    828   1.45    itojun 
    829    1.9    itojun 	/*
    830   1.45    itojun 	 * The caller of this function may specify to use the minimum MTU
    831   1.45    itojun 	 * in some cases.
    832   1.97    rpaulo 	 * An advanced API option (IPV6_USE_MIN_MTU) can also override MTU
    833   1.97    rpaulo 	 * setting.  The logic is a bit complicated; by default, unicast
    834   1.97    rpaulo 	 * packets will follow path MTU while multicast packets will be sent at
    835   1.97    rpaulo 	 * the minimum MTU.  If IP6PO_MINMTU_ALL is specified, all packets
    836   1.97    rpaulo 	 * including unicast ones will be sent at the minimum MTU.  Multicast
    837   1.97    rpaulo 	 * packets will always be sent at the minimum MTU unless
    838   1.97    rpaulo 	 * IP6PO_MINMTU_DISABLE is explicitly specified.
    839   1.97    rpaulo 	 * See RFC 3542 for more details.
    840    1.2    itojun 	 */
    841   1.45    itojun 	if (mtu > IPV6_MMTU) {
    842   1.45    itojun 		if ((flags & IPV6_MINMTU))
    843   1.45    itojun 			mtu = IPV6_MMTU;
    844   1.97    rpaulo 		else if (opt && opt->ip6po_minmtu == IP6PO_MINMTU_ALL)
    845   1.97    rpaulo 			mtu = IPV6_MMTU;
    846   1.97    rpaulo 		else if (IN6_IS_ADDR_MULTICAST(&ip6->ip6_dst) &&
    847   1.97    rpaulo 			 (opt == NULL ||
    848   1.97    rpaulo 			  opt->ip6po_minmtu != IP6PO_MINMTU_DISABLE)) {
    849   1.97    rpaulo 			mtu = IPV6_MMTU;
    850   1.97    rpaulo 		}
    851   1.43    itojun 	}
    852   1.43    itojun 
    853   1.94    rpaulo 	/*
    854   1.94    rpaulo 	 * clear embedded scope identifiers if necessary.
    855   1.94    rpaulo 	 * in6_clearscope will touch the addresses only when necessary.
    856   1.94    rpaulo 	 */
    857   1.94    rpaulo 	in6_clearscope(&ip6->ip6_src);
    858   1.94    rpaulo 	in6_clearscope(&ip6->ip6_dst);
    859    1.2    itojun 
    860    1.2    itojun 	/*
    861    1.2    itojun 	 * If the outgoing packet contains a hop-by-hop options header,
    862    1.2    itojun 	 * it must be examined and processed even by the source node.
    863    1.2    itojun 	 * (RFC 2460, section 4.)
    864    1.2    itojun 	 */
    865    1.2    itojun 	if (exthdrs.ip6e_hbh) {
    866   1.31    itojun 		struct ip6_hbh *hbh = mtod(exthdrs.ip6e_hbh, struct ip6_hbh *);
    867    1.5    itojun 		u_int32_t dummy1; /* XXX unused */
    868    1.2    itojun 		u_int32_t dummy2; /* XXX unused */
    869    1.2    itojun 
    870    1.2    itojun 		/*
    871    1.2    itojun 		 *  XXX: if we have to send an ICMPv6 error to the sender,
    872    1.2    itojun 		 *       we need the M_LOOP flag since icmp6_error() expects
    873    1.2    itojun 		 *       the IPv6 and the hop-by-hop options header are
    874    1.2    itojun 		 *       continuous unless the flag is set.
    875    1.2    itojun 		 */
    876    1.2    itojun 		m->m_flags |= M_LOOP;
    877    1.2    itojun 		m->m_pkthdr.rcvif = ifp;
    878   1.49    itojun 		if (ip6_process_hopopts(m, (u_int8_t *)(hbh + 1),
    879   1.49    itojun 		    ((hbh->ip6h_len + 1) << 3) - sizeof(struct ip6_hbh),
    880   1.49    itojun 		    &dummy1, &dummy2) < 0) {
    881    1.2    itojun 			/* m was already freed at this point */
    882    1.2    itojun 			error = EINVAL;/* better error? */
    883    1.2    itojun 			goto done;
    884    1.2    itojun 		}
    885    1.2    itojun 		m->m_flags &= ~M_LOOP; /* XXX */
    886    1.2    itojun 		m->m_pkthdr.rcvif = NULL;
    887    1.2    itojun 	}
    888    1.2    itojun 
    889   1.15   darrenr #ifdef PFIL_HOOKS
    890   1.15   darrenr 	/*
    891   1.15   darrenr 	 * Run through list of hooks for output packets.
    892   1.15   darrenr 	 */
    893   1.49    itojun 	if ((error = pfil_run_hooks(&inet6_pfil_hook, &m, ifp, PFIL_OUT)) != 0)
    894   1.27   thorpej 		goto done;
    895   1.27   thorpej 	if (m == NULL)
    896   1.27   thorpej 		goto done;
    897   1.27   thorpej 	ip6 = mtod(m, struct ip6_hdr *);
    898   1.15   darrenr #endif /* PFIL_HOOKS */
    899    1.2    itojun 	/*
    900    1.2    itojun 	 * Send the packet to the outgoing interface.
    901   1.19    itojun 	 * If necessary, do IPv6 fragmentation before sending.
    902   1.78    itojun 	 *
    903   1.78    itojun 	 * the logic here is rather complex:
    904   1.78    itojun 	 * 1: normal case (dontfrag == 0, alwaysfrag == 0)
    905   1.78    itojun 	 * 1-a:	send as is if tlen <= path mtu
    906   1.78    itojun 	 * 1-b:	fragment if tlen > path mtu
    907   1.78    itojun 	 *
    908   1.78    itojun 	 * 2: if user asks us not to fragment (dontfrag == 1)
    909   1.78    itojun 	 * 2-a:	send as is if tlen <= interface mtu
    910   1.78    itojun 	 * 2-b:	error if tlen > interface mtu
    911   1.78    itojun 	 *
    912   1.78    itojun 	 * 3: if we always need to attach fragment header (alwaysfrag == 1)
    913   1.78    itojun 	 *	always fragment
    914   1.78    itojun 	 *
    915   1.78    itojun 	 * 4: if dontfrag == 1 && alwaysfrag == 1
    916   1.78    itojun 	 *	error, as we cannot handle this conflicting request
    917    1.2    itojun 	 */
    918    1.2    itojun 	tlen = m->m_pkthdr.len;
    919  1.105      yamt 	tso = (m->m_pkthdr.csum_flags & M_CSUM_TSOv6) != 0;
    920   1.97    rpaulo 	if (opt && (opt->ip6po_flags & IP6PO_DONTFRAG))
    921   1.97    rpaulo 		dontfrag = 1;
    922   1.97    rpaulo 	else
    923   1.97    rpaulo 		dontfrag = 0;
    924   1.97    rpaulo 
    925   1.78    itojun 	if (dontfrag && alwaysfrag) {	/* case 4 */
    926   1.78    itojun 		/* conflicting request - can't transmit */
    927   1.78    itojun 		error = EMSGSIZE;
    928   1.78    itojun 		goto bad;
    929   1.78    itojun 	}
    930  1.105      yamt 	if (dontfrag && (!tso && tlen > IN6_LINKMTU(ifp))) {	/* case 2-b */
    931   1.78    itojun 		/*
    932   1.78    itojun 		 * Even if the DONTFRAG option is specified, we cannot send the
    933   1.78    itojun 		 * packet when the data length is larger than the MTU of the
    934   1.78    itojun 		 * outgoing interface.
    935   1.78    itojun 		 * Notify the error by sending IPV6_PATHMTU ancillary data as
    936   1.78    itojun 		 * well as returning an error code (the latter is not described
    937   1.78    itojun 		 * in the API spec.)
    938   1.78    itojun 		 */
    939   1.78    itojun 		u_int32_t mtu32;
    940   1.78    itojun 		struct ip6ctlparam ip6cp;
    941   1.78    itojun 
    942   1.78    itojun 		mtu32 = (u_int32_t)mtu;
    943   1.78    itojun 		bzero(&ip6cp, sizeof(ip6cp));
    944   1.78    itojun 		ip6cp.ip6c_cmdarg = (void *)&mtu32;
    945  1.115    dyoung 		pfctlinput2(PRC_MSGSIZE,
    946  1.118    dyoung 		    rtcache_getdst(ro_pmtu), &ip6cp);
    947   1.78    itojun 
    948   1.78    itojun 		error = EMSGSIZE;
    949   1.78    itojun 		goto bad;
    950   1.78    itojun 	}
    951   1.97    rpaulo 
    952   1.78    itojun 	/*
    953   1.78    itojun 	 * transmit packet without fragmentation
    954   1.78    itojun 	 */
    955  1.105      yamt 	if (dontfrag || (!alwaysfrag && (tlen <= mtu || tso))) {
    956  1.105      yamt 		/* case 1-a and 2-a */
    957   1.26    itojun 		struct in6_ifaddr *ia6;
    958   1.89      yamt 		int sw_csum;
    959   1.78    itojun 
    960   1.26    itojun 		ip6 = mtod(m, struct ip6_hdr *);
    961   1.26    itojun 		ia6 = in6_ifawithifp(ifp, &ip6->ip6_src);
    962   1.26    itojun 		if (ia6) {
    963   1.42    itojun 			/* Record statistics for this interface address. */
    964   1.78    itojun 			ia6->ia_ifa.ifa_data.ifad_outbytes += m->m_pkthdr.len;
    965    1.9    itojun 		}
    966   1.28    itojun #ifdef IPSEC
    967   1.28    itojun 		/* clean ipsec history once it goes out of the node */
    968   1.28    itojun 		ipsec_delaux(m);
    969   1.28    itojun #endif
    970   1.89      yamt 
    971   1.89      yamt 		sw_csum = m->m_pkthdr.csum_flags & ~ifp->if_csum_flags_tx;
    972   1.89      yamt 		if ((sw_csum & (M_CSUM_UDPv6|M_CSUM_TCPv6)) != 0) {
    973   1.90      yamt 			if (IN6_NEED_CHECKSUM(ifp,
    974   1.90      yamt 			    sw_csum & (M_CSUM_UDPv6|M_CSUM_TCPv6))) {
    975   1.90      yamt 				in6_delayed_cksum(m);
    976   1.90      yamt 			}
    977   1.89      yamt 			m->m_pkthdr.csum_flags &= ~(M_CSUM_UDPv6|M_CSUM_TCPv6);
    978   1.89      yamt 		}
    979   1.89      yamt 
    980  1.118    dyoung 		KASSERT(dst != NULL);
    981  1.105      yamt 		if (__predict_true(!tso ||
    982  1.105      yamt 		    (ifp->if_capenable & IFCAP_TSOv6) != 0)) {
    983  1.105      yamt 			error = nd6_output(ifp, origifp, m, dst, rt);
    984  1.105      yamt 		} else {
    985  1.105      yamt 			error = ip6_tso_output(ifp, origifp, m, dst, rt);
    986  1.105      yamt 		}
    987    1.2    itojun 		goto done;
    988   1.78    itojun 	}
    989   1.78    itojun 
    990  1.105      yamt 	if (tso) {
    991  1.105      yamt 		error = EINVAL; /* XXX */
    992  1.105      yamt 		goto bad;
    993  1.105      yamt 	}
    994  1.105      yamt 
    995   1.78    itojun 	/*
    996   1.78    itojun 	 * try to fragment the packet.  case 1-b and 3
    997   1.78    itojun 	 */
    998   1.78    itojun 	if (mtu < IPV6_MMTU) {
    999   1.78    itojun 		/* path MTU cannot be less than IPV6_MMTU */
   1000    1.2    itojun 		error = EMSGSIZE;
   1001    1.9    itojun 		in6_ifstat_inc(ifp, ifs6_out_fragfail);
   1002    1.2    itojun 		goto bad;
   1003   1.78    itojun 	} else if (ip6->ip6_plen == 0) {
   1004   1.78    itojun 		/* jumbo payload cannot be fragmented */
   1005    1.2    itojun 		error = EMSGSIZE;
   1006    1.9    itojun 		in6_ifstat_inc(ifp, ifs6_out_fragfail);
   1007    1.2    itojun 		goto bad;
   1008    1.2    itojun 	} else {
   1009    1.2    itojun 		struct mbuf **mnext, *m_frgpart;
   1010    1.2    itojun 		struct ip6_frag *ip6f;
   1011   1.70    itojun 		u_int32_t id = htonl(ip6_randomid());
   1012    1.2    itojun 		u_char nextproto;
   1013   1.99    rpaulo #if 0				/* see below */
   1014   1.78    itojun 		struct ip6ctlparam ip6cp;
   1015   1.78    itojun 		u_int32_t mtu32;
   1016   1.99    rpaulo #endif
   1017    1.2    itojun 
   1018    1.2    itojun 		/*
   1019    1.2    itojun 		 * Too large for the destination or interface;
   1020    1.2    itojun 		 * fragment if possible.
   1021    1.2    itojun 		 * Must be able to put at least 8 bytes per fragment.
   1022    1.2    itojun 		 */
   1023    1.2    itojun 		hlen = unfragpartlen;
   1024    1.2    itojun 		if (mtu > IPV6_MAXPACKET)
   1025    1.2    itojun 			mtu = IPV6_MAXPACKET;
   1026   1.78    itojun 
   1027   1.99    rpaulo #if 0
   1028   1.99    rpaulo 		/*
   1029   1.99    rpaulo 		 * It is believed this code is a leftover from the
   1030   1.99    rpaulo 		 * development of the IPV6_RECVPATHMTU sockopt and
   1031   1.99    rpaulo 		 * associated work to implement RFC3542.
   1032   1.99    rpaulo 		 * It's not entirely clear what the intent of the API
   1033   1.99    rpaulo 		 * is at this point, so disable this code for now.
   1034   1.99    rpaulo 		 * The IPV6_RECVPATHMTU sockopt and/or IPV6_DONTFRAG
   1035   1.99    rpaulo 		 * will send notifications if the application requests.
   1036   1.99    rpaulo 		 */
   1037   1.99    rpaulo 
   1038   1.78    itojun 		/* Notify a proper path MTU to applications. */
   1039   1.78    itojun 		mtu32 = (u_int32_t)mtu;
   1040   1.78    itojun 		bzero(&ip6cp, sizeof(ip6cp));
   1041   1.78    itojun 		ip6cp.ip6c_cmdarg = (void *)&mtu32;
   1042  1.115    dyoung 		pfctlinput2(PRC_MSGSIZE,
   1043  1.118    dyoung 		    rtcache_getdst(ro_pmtu), &ip6cp);
   1044   1.99    rpaulo #endif
   1045   1.78    itojun 
   1046    1.2    itojun 		len = (mtu - hlen - sizeof(struct ip6_frag)) & ~7;
   1047    1.2    itojun 		if (len < 8) {
   1048    1.2    itojun 			error = EMSGSIZE;
   1049    1.9    itojun 			in6_ifstat_inc(ifp, ifs6_out_fragfail);
   1050    1.2    itojun 			goto bad;
   1051    1.2    itojun 		}
   1052    1.2    itojun 
   1053    1.2    itojun 		mnext = &m->m_nextpkt;
   1054    1.2    itojun 
   1055    1.2    itojun 		/*
   1056    1.2    itojun 		 * Change the next header field of the last header in the
   1057    1.2    itojun 		 * unfragmentable part.
   1058    1.2    itojun 		 */
   1059    1.2    itojun 		if (exthdrs.ip6e_rthdr) {
   1060    1.2    itojun 			nextproto = *mtod(exthdrs.ip6e_rthdr, u_char *);
   1061    1.2    itojun 			*mtod(exthdrs.ip6e_rthdr, u_char *) = IPPROTO_FRAGMENT;
   1062   1.19    itojun 		} else if (exthdrs.ip6e_dest1) {
   1063    1.2    itojun 			nextproto = *mtod(exthdrs.ip6e_dest1, u_char *);
   1064    1.2    itojun 			*mtod(exthdrs.ip6e_dest1, u_char *) = IPPROTO_FRAGMENT;
   1065   1.19    itojun 		} else if (exthdrs.ip6e_hbh) {
   1066    1.2    itojun 			nextproto = *mtod(exthdrs.ip6e_hbh, u_char *);
   1067    1.2    itojun 			*mtod(exthdrs.ip6e_hbh, u_char *) = IPPROTO_FRAGMENT;
   1068   1.19    itojun 		} else {
   1069    1.2    itojun 			nextproto = ip6->ip6_nxt;
   1070    1.2    itojun 			ip6->ip6_nxt = IPPROTO_FRAGMENT;
   1071    1.2    itojun 		}
   1072    1.2    itojun 
   1073   1.89      yamt 		if ((m->m_pkthdr.csum_flags & (M_CSUM_UDPv6|M_CSUM_TCPv6))
   1074   1.89      yamt 		    != 0) {
   1075   1.90      yamt 			if (IN6_NEED_CHECKSUM(ifp,
   1076   1.90      yamt 			    m->m_pkthdr.csum_flags &
   1077   1.90      yamt 			    (M_CSUM_UDPv6|M_CSUM_TCPv6))) {
   1078   1.90      yamt 				in6_delayed_cksum(m);
   1079   1.90      yamt 			}
   1080   1.89      yamt 			m->m_pkthdr.csum_flags &= ~(M_CSUM_UDPv6|M_CSUM_TCPv6);
   1081   1.89      yamt 		}
   1082   1.89      yamt 
   1083    1.2    itojun 		/*
   1084    1.2    itojun 		 * Loop through length of segment after first fragment,
   1085   1.42    itojun 		 * make new header and copy data of each part and link onto
   1086   1.42    itojun 		 * chain.
   1087    1.2    itojun 		 */
   1088    1.2    itojun 		m0 = m;
   1089    1.2    itojun 		for (off = hlen; off < tlen; off += len) {
   1090   1.68    itojun 			struct mbuf *mlast;
   1091   1.68    itojun 
   1092    1.2    itojun 			MGETHDR(m, M_DONTWAIT, MT_HEADER);
   1093    1.2    itojun 			if (!m) {
   1094    1.2    itojun 				error = ENOBUFS;
   1095    1.2    itojun 				ip6stat.ip6s_odropped++;
   1096    1.2    itojun 				goto sendorfree;
   1097    1.2    itojun 			}
   1098   1.78    itojun 			m->m_pkthdr.rcvif = NULL;
   1099    1.2    itojun 			m->m_flags = m0->m_flags & M_COPYFLAGS;
   1100    1.2    itojun 			*mnext = m;
   1101    1.2    itojun 			mnext = &m->m_nextpkt;
   1102    1.2    itojun 			m->m_data += max_linkhdr;
   1103    1.2    itojun 			mhip6 = mtod(m, struct ip6_hdr *);
   1104    1.2    itojun 			*mhip6 = *ip6;
   1105    1.2    itojun 			m->m_len = sizeof(*mhip6);
   1106   1.42    itojun 			error = ip6_insertfraghdr(m0, m, hlen, &ip6f);
   1107   1.42    itojun 			if (error) {
   1108    1.2    itojun 				ip6stat.ip6s_odropped++;
   1109    1.2    itojun 				goto sendorfree;
   1110    1.2    itojun 			}
   1111   1.69    itojun 			ip6f->ip6f_offlg = htons((u_int16_t)((off - hlen) & ~7));
   1112    1.2    itojun 			if (off + len >= tlen)
   1113    1.2    itojun 				len = tlen - off;
   1114    1.2    itojun 			else
   1115    1.2    itojun 				ip6f->ip6f_offlg |= IP6F_MORE_FRAG;
   1116   1.69    itojun 			mhip6->ip6_plen = htons((u_int16_t)(len + hlen +
   1117   1.49    itojun 			    sizeof(*ip6f) - sizeof(struct ip6_hdr)));
   1118    1.2    itojun 			if ((m_frgpart = m_copy(m0, off, len)) == 0) {
   1119    1.2    itojun 				error = ENOBUFS;
   1120    1.2    itojun 				ip6stat.ip6s_odropped++;
   1121    1.2    itojun 				goto sendorfree;
   1122    1.2    itojun 			}
   1123   1.68    itojun 			for (mlast = m; mlast->m_next; mlast = mlast->m_next)
   1124   1.68    itojun 				;
   1125   1.68    itojun 			mlast->m_next = m_frgpart;
   1126    1.2    itojun 			m->m_pkthdr.len = len + hlen + sizeof(*ip6f);
   1127    1.2    itojun 			m->m_pkthdr.rcvif = (struct ifnet *)0;
   1128    1.2    itojun 			ip6f->ip6f_reserved = 0;
   1129    1.2    itojun 			ip6f->ip6f_ident = id;
   1130    1.2    itojun 			ip6f->ip6f_nxt = nextproto;
   1131    1.2    itojun 			ip6stat.ip6s_ofragments++;
   1132    1.9    itojun 			in6_ifstat_inc(ifp, ifs6_out_fragcreat);
   1133    1.2    itojun 		}
   1134    1.9    itojun 
   1135    1.9    itojun 		in6_ifstat_inc(ifp, ifs6_out_fragok);
   1136    1.2    itojun 	}
   1137    1.2    itojun 
   1138    1.2    itojun 	/*
   1139    1.2    itojun 	 * Remove leading garbages.
   1140    1.2    itojun 	 */
   1141    1.2    itojun sendorfree:
   1142    1.2    itojun 	m = m0->m_nextpkt;
   1143    1.2    itojun 	m0->m_nextpkt = 0;
   1144    1.2    itojun 	m_freem(m0);
   1145    1.2    itojun 	for (m0 = m; m; m = m0) {
   1146    1.2    itojun 		m0 = m->m_nextpkt;
   1147    1.2    itojun 		m->m_nextpkt = 0;
   1148    1.2    itojun 		if (error == 0) {
   1149   1.26    itojun 			struct in6_ifaddr *ia6;
   1150   1.26    itojun 			ip6 = mtod(m, struct ip6_hdr *);
   1151   1.26    itojun 			ia6 = in6_ifawithifp(ifp, &ip6->ip6_src);
   1152   1.26    itojun 			if (ia6) {
   1153   1.42    itojun 				/*
   1154   1.42    itojun 				 * Record statistics for this interface
   1155   1.42    itojun 				 * address.
   1156   1.42    itojun 				 */
   1157   1.26    itojun 				ia6->ia_ifa.ifa_data.ifad_outbytes +=
   1158   1.78    itojun 				    m->m_pkthdr.len;
   1159    1.9    itojun 			}
   1160   1.28    itojun #ifdef IPSEC
   1161   1.28    itojun 			/* clean ipsec history once it goes out of the node */
   1162   1.28    itojun 			ipsec_delaux(m);
   1163    1.9    itojun #endif
   1164  1.118    dyoung 			KASSERT(dst != NULL);
   1165   1.97    rpaulo 			error = nd6_output(ifp, origifp, m, dst, rt);
   1166   1.19    itojun 		} else
   1167    1.2    itojun 			m_freem(m);
   1168    1.2    itojun 	}
   1169    1.2    itojun 
   1170    1.2    itojun 	if (error == 0)
   1171    1.2    itojun 		ip6stat.ip6s_fragmented++;
   1172    1.2    itojun 
   1173    1.2    itojun done:
   1174  1.124    dyoung 	rtcache_free(&ip6route);
   1175    1.2    itojun 
   1176    1.2    itojun #ifdef IPSEC
   1177    1.2    itojun 	if (sp != NULL)
   1178    1.2    itojun 		key_freesp(sp);
   1179    1.2    itojun #endif /* IPSEC */
   1180  1.114  degroote #ifdef FAST_IPSEC
   1181  1.114  degroote 	if (sp != NULL)
   1182  1.114  degroote 		KEY_FREESP(&sp);
   1183  1.114  degroote #endif /* FAST_IPSEC */
   1184  1.114  degroote 
   1185    1.2    itojun 
   1186   1.57    itojun 	return (error);
   1187    1.2    itojun 
   1188    1.2    itojun freehdrs:
   1189    1.2    itojun 	m_freem(exthdrs.ip6e_hbh);	/* m_freem will check if mbuf is 0 */
   1190    1.2    itojun 	m_freem(exthdrs.ip6e_dest1);
   1191    1.2    itojun 	m_freem(exthdrs.ip6e_rthdr);
   1192    1.2    itojun 	m_freem(exthdrs.ip6e_dest2);
   1193   1.48    itojun 	/* FALLTHROUGH */
   1194    1.2    itojun bad:
   1195    1.2    itojun 	m_freem(m);
   1196    1.2    itojun 	goto done;
   1197  1.118    dyoung badscope:
   1198  1.118    dyoung 	ip6stat.ip6s_badscope++;
   1199  1.118    dyoung 	in6_ifstat_inc(origifp, ifs6_out_discard);
   1200  1.118    dyoung 	if (error == 0)
   1201  1.118    dyoung 		error = EHOSTUNREACH; /* XXX */
   1202  1.118    dyoung 	goto bad;
   1203    1.2    itojun }
   1204    1.2    itojun 
                         /*
                          * Allocate a fresh mbuf of length hlen and, if hdr is non-NULL, fill it
                          * with a copy of the hlen bytes at hdr (by the function's name, an IPv6
                          * extension header).
                          *
                          * mp:   on success, receives the newly allocated mbuf.
                          * hdr:  source bytes to copy; when NULL nothing is copied and the mbuf
                          *       contents are left as allocated.
                          * hlen: number of bytes; becomes the new mbuf's m_len.
                          *
                          * Returns 0 on success, or ENOBUFS if hlen exceeds MCLBYTES or an
                          * allocation fails.  On failure *mp is not written.
                          *
                          * NOTE(review): hlen is a signed int and only its upper bound is
                          * checked here; presumably callers never pass a negative length --
                          * confirm.
                          */
   1205    1.2    itojun static int
   1206  1.119  christos ip6_copyexthdr(struct mbuf **mp, void *hdr, int hlen)
   1207    1.2    itojun {
   1208    1.2    itojun 	struct mbuf *m;
   1209    1.2    itojun 
                         	/* Only one mbuf is used, so one cluster is the largest size handled. */
   1210    1.2    itojun 	if (hlen > MCLBYTES)
   1211   1.57    itojun 		return (ENOBUFS); /* XXX */
   1212    1.2    itojun 
                         	/* Non-blocking allocation; fail with ENOBUFS if no mbuf is available. */
   1213    1.2    itojun 	MGET(m, M_DONTWAIT, MT_DATA);
   1214    1.2    itojun 	if (!m)
   1215   1.57    itojun 		return (ENOBUFS);
   1216    1.2    itojun 
                         	/* Larger than MLEN: attach a cluster to the mbuf. */
   1217    1.2    itojun 	if (hlen > MLEN) {
   1218    1.2    itojun 		MCLGET(m, M_DONTWAIT);
                         		/* M_EXT still clear means no cluster was attached. */
   1219    1.2    itojun 		if ((m->m_flags & M_EXT) == 0) {
   1220    1.2    itojun 			m_free(m);
   1221   1.57    itojun 			return (ENOBUFS);
   1222    1.2    itojun 		}
   1223    1.2    itojun 	}
   1224    1.2    itojun 	m->m_len = hlen;
                         	/* m_len is set even when hdr is NULL and no bytes are copied. */
   1225    1.2    itojun 	if (hdr)
   1226  1.117  christos 		bcopy(hdr, mtod(m, void *), hlen);
   1227    1.2    itojun 
   1228    1.2    itojun 	*mp = m;
   1229   1.57    itojun 	return (0);
   1230    1.2    itojun }
   1231    1.2    itojun 
   1232    1.2    itojun /*
   1233   1.89      yamt  * Process a delayed payload checksum calculation.
                          *
                          * The packet must be flagged with exactly one of M_CSUM_UDPv6 and
                          * M_CSUM_TCPv6, and with none of the IPv4 checksum/TSO flags; all
                          * three conditions are asserted below.
                          *
                          * m_pkthdr.csum_data encodes two values: the header length, which is
                          * passed to in6_cksum() together with the remaining packet length,
                          * and the offset (relative to that header length) at which the
                          * resulting 16-bit checksum is stored back into the packet.
   1234   1.89      yamt  */
   1235   1.89      yamt void
   1236   1.89      yamt in6_delayed_cksum(struct mbuf *m)
   1237   1.89      yamt {
   1238   1.89      yamt 	uint16_t csum, offset;
   1239   1.89      yamt 
   1240   1.89      yamt 	KASSERT((m->m_pkthdr.csum_flags & (M_CSUM_UDPv6|M_CSUM_TCPv6)) != 0);
   1241   1.89      yamt 	KASSERT((~m->m_pkthdr.csum_flags & (M_CSUM_UDPv6|M_CSUM_TCPv6)) != 0);
   1242   1.89      yamt 	KASSERT((m->m_pkthdr.csum_flags
   1243   1.89      yamt 	    & (M_CSUM_UDPv4|M_CSUM_TCPv4|M_CSUM_TSOv4)) == 0);
   1244   1.89      yamt 
   1245   1.89      yamt 	offset = M_CSUM_DATA_IPv6_HL(m->m_pkthdr.csum_data);
   1246   1.89      yamt 	csum = in6_cksum(m, 0, offset, m->m_pkthdr.len - offset);
                         	/* For UDP, a computed checksum of 0 is sent as 0xffff instead. */
   1247   1.89      yamt 	if (csum == 0 && (m->m_pkthdr.csum_flags & M_CSUM_UDPv6) != 0) {
   1248   1.89      yamt 		csum = 0xffff;
   1249   1.89      yamt 	}
   1250   1.89      yamt 
                         	/*
                         	 * Store the result.  If the checksum field does not lie entirely
                         	 * within the first mbuf, go through m_copyback(); otherwise write
                         	 * it in place.
                         	 */
   1251   1.89      yamt 	offset += M_CSUM_DATA_IPv6_OFFSET(m->m_pkthdr.csum_data);
   1252   1.89      yamt 	if ((offset + sizeof(csum)) > m->m_len) {
   1253   1.89      yamt 		m_copyback(m, offset, sizeof(csum), &csum);
   1254   1.89      yamt 	} else {
   1255  1.117  christos 		*(uint16_t *)(mtod(m, char *) + offset) = csum;
   1256   1.89      yamt 	}
   1257   1.89      yamt }
   1258   1.89      yamt 
   1259   1.89      yamt /*
   1260   1.19    itojun  * Insert jumbo payload option.
                          *
                          * Adds JUMBOOPTLEN (8) bytes to the hop-by-hop options header kept in
                          * exthdrs->ip6e_hbh, creating that header when it does not exist yet:
                          *   bytes 0-1  the hop-by-hop header itself (new header), or a PadN
                          *              option with a zero length byte (existing header)
                          *   byte  2    IP6OPT_JUMBO
                          *   byte  3    4 (option data length)
                          *   bytes 4-7  plen + JUMBOOPTLEN in network byte order
                          *
                          * exthdrs->ip6e_ip6->m_pkthdr.len is increased by JUMBOOPTLEN as well.
                          *
                          * Returns 0 on success, or ENOBUFS when an mbuf or cluster cannot be
                          * allocated or the enlarged header would not fit in a cluster.
   1261    1.2    itojun  */
   1262    1.2    itojun static int
   1263  1.119  christos ip6_insert_jumboopt(struct ip6_exthdrs *exthdrs, u_int32_t plen)
   1264    1.2    itojun {
   1265    1.2    itojun 	struct mbuf *mopt;
   1266   1.56    itojun 	u_int8_t *optbuf;
   1267   1.25    itojun 	u_int32_t v;
   1268    1.2    itojun 
   1269    1.2    itojun #define JUMBOOPTLEN	8	/* length of jumbo payload option and padding */
   1270    1.2    itojun 
   1271    1.2    itojun 	/*
   1272    1.2    itojun 	 * If there is no hop-by-hop options header, allocate new one.
   1273    1.2    itojun 	 * If there is one but it doesn't have enough space to store the
   1274    1.2    itojun 	 * jumbo payload option, allocate a cluster to store the whole options.
   1275    1.2    itojun 	 * Otherwise, use it to store the options.
   1276    1.2    itojun 	 */
   1277    1.2    itojun 	if (exthdrs->ip6e_hbh == 0) {
   1278    1.2    itojun 		MGET(mopt, M_DONTWAIT, MT_DATA);
   1279    1.2    itojun 		if (mopt == 0)
   1280   1.57    itojun 			return (ENOBUFS);
   1281    1.2    itojun 		mopt->m_len = JUMBOOPTLEN;
   1282   1.56    itojun 		optbuf = mtod(mopt, u_int8_t *);
   1283    1.2    itojun 		optbuf[1] = 0;	/* = ((JUMBOOPTLEN) >> 3) - 1 */
                         		/*
                         		 * NOTE(review): optbuf[0] is not written in this function;
                         		 * presumably the caller fills it in later -- confirm.
                         		 */
   1284    1.2    itojun 		exthdrs->ip6e_hbh = mopt;
   1285   1.19    itojun 	} else {
   1286    1.2    itojun 		struct ip6_hbh *hbh;
   1287    1.2    itojun 
   1288    1.2    itojun 		mopt = exthdrs->ip6e_hbh;
   1289    1.2    itojun 		if (M_TRAILINGSPACE(mopt) < JUMBOOPTLEN) {
   1290   1.25    itojun 			/*
   1291   1.25    itojun 			 * XXX assumption:
   1292   1.25    itojun 			 * - exthdrs->ip6e_hbh is not referenced from places
   1293   1.25    itojun 			 *   other than exthdrs.
   1294   1.25    itojun 			 * - exthdrs->ip6e_hbh is not an mbuf chain.
   1295   1.25    itojun 			 */
   1296    1.2    itojun 			int oldoptlen = mopt->m_len;
   1297   1.25    itojun 			struct mbuf *n;
   1298    1.2    itojun 
   1299   1.25    itojun 			/*
   1300   1.25    itojun 			 * XXX: give up if the whole (new) hbh header does
   1301   1.25    itojun 			 * not fit even in an mbuf cluster.
   1302   1.25    itojun 			 */
   1303   1.25    itojun 			if (oldoptlen + JUMBOOPTLEN > MCLBYTES)
   1304   1.57    itojun 				return (ENOBUFS);
   1305    1.2    itojun 
   1306   1.25    itojun 			/*
   1307   1.25    itojun 			 * As a consequence, we must always prepare a cluster
   1308   1.25    itojun 			 * at this point.
   1309   1.25    itojun 			 */
   1310   1.25    itojun 			MGET(n, M_DONTWAIT, MT_DATA);
   1311   1.25    itojun 			if (n) {
   1312   1.25    itojun 				MCLGET(n, M_DONTWAIT);
   1313   1.25    itojun 				if ((n->m_flags & M_EXT) == 0) {
   1314   1.25    itojun 					m_freem(n);
   1315   1.25    itojun 					n = NULL;
   1316   1.25    itojun 				}
   1317   1.25    itojun 			}
   1318   1.25    itojun 			if (!n)
   1319   1.57    itojun 				return (ENOBUFS);
                         			/*
                         			 * Copy the old options into the cluster, point optbuf
                         			 * just past them, and replace the old mbuf with the
                         			 * new one.
                         			 */
   1320   1.25    itojun 			n->m_len = oldoptlen + JUMBOOPTLEN;
   1321  1.117  christos 			bcopy(mtod(mopt, void *), mtod(n, void *),
   1322   1.78    itojun 			    oldoptlen);
   1323   1.56    itojun 			optbuf = mtod(n, u_int8_t *) + oldoptlen;
   1324   1.25    itojun 			m_freem(mopt);
   1325   1.33    itojun 			mopt = exthdrs->ip6e_hbh = n;
   1326   1.19    itojun 		} else {
   1327   1.56    itojun 			optbuf = mtod(mopt, u_int8_t *) + mopt->m_len;
   1328    1.2    itojun 			mopt->m_len += JUMBOOPTLEN;
   1329    1.2    itojun 		}
                         		/* The first two appended bytes form a PadN option of length 0. */
   1330    1.2    itojun 		optbuf[0] = IP6OPT_PADN;
   1331   1.58    itojun 		optbuf[1] = 0;
   1332    1.2    itojun 
   1333    1.2    itojun 		/*
   1334    1.2    itojun 		 * Adjust the header length according to the pad and
   1335    1.2    itojun 		 * the jumbo payload option.
   1336    1.2    itojun 		 */
   1337    1.2    itojun 		hbh = mtod(mopt, struct ip6_hbh *);
   1338    1.2    itojun 		hbh->ip6h_len += (JUMBOOPTLEN >> 3);
   1339    1.2    itojun 	}
   1340    1.2    itojun 
   1341    1.2    itojun 	/* fill in the option. */
   1342    1.2    itojun 	optbuf[2] = IP6OPT_JUMBO;
   1343    1.2    itojun 	optbuf[3] = 4;
                         	/* The stored length also counts the JUMBOOPTLEN bytes added here. */
   1344   1.25    itojun 	v = (u_int32_t)htonl(plen + JUMBOOPTLEN);
   1345   1.25    itojun 	bcopy(&v, &optbuf[4], sizeof(u_int32_t));
   1346    1.2    itojun 
   1347    1.2    itojun 	/* finally, adjust the packet header length */
   1348    1.2    itojun 	exthdrs->ip6e_ip6->m_pkthdr.len += JUMBOOPTLEN;
   1349    1.2    itojun 
   1350   1.57    itojun 	return (0);
   1351    1.2    itojun #undef JUMBOOPTLEN
   1352    1.2    itojun }
   1353    1.2    itojun 
   1354    1.2    itojun /*
   1355    1.2    itojun  * Insert fragment header and copy unfragmentable header portions.
                          *
                          * m0:      packet the headers are copied from.
                          * m:       mbuf the copied headers and the fragment header are chained
                          *          onto.
                          * hlen:    when larger than sizeof(struct ip6_hdr), the bytes of m0
                          *          between sizeof(struct ip6_hdr) and hlen are copied with
                          *          m_copym() and linked in as m->m_next.
                          * frghdrp: receives a pointer to the space reserved for the fragment
                          *          header; that space is not initialized here.
                          *
                          * Returns 0 on success or ENOBUFS when a copy or allocation fails.  If
                          * the fragment-header mbuf cannot be allocated, the already copied
                          * chain stays linked to m.
   1356    1.2    itojun  */
   1357    1.2    itojun static int
   1358  1.119  christos ip6_insertfraghdr(struct mbuf *m0, struct mbuf *m, int hlen,
   1359  1.119  christos 	struct ip6_frag **frghdrp)
   1360    1.2    itojun {
   1361    1.2    itojun 	struct mbuf *n, *mlast;
   1362    1.2    itojun 
   1363    1.2    itojun 	if (hlen > sizeof(struct ip6_hdr)) {
   1364    1.2    itojun 		n = m_copym(m0, sizeof(struct ip6_hdr),
   1365   1.49    itojun 		    hlen - sizeof(struct ip6_hdr), M_DONTWAIT);
   1366    1.2    itojun 		if (n == 0)
   1367   1.57    itojun 			return (ENOBUFS);
   1368    1.2    itojun 		m->m_next = n;
   1369   1.19    itojun 	} else
   1370    1.2    itojun 		n = m;
   1371    1.2    itojun 
   1372    1.2    itojun 	/* Search for the last mbuf of unfragmentable part. */
   1373    1.2    itojun 	for (mlast = n; mlast->m_next; mlast = mlast->m_next)
   1374    1.2    itojun 		;
   1375    1.2    itojun 
                         	/*
                         	 * Only reuse trailing space when the last mbuf does not use
                         	 * external storage (M_EXT) and has room for a whole ip6_frag.
                         	 */
   1376    1.2    itojun 	if ((mlast->m_flags & M_EXT) == 0 &&
   1377   1.22    itojun 	    M_TRAILINGSPACE(mlast) >= sizeof(struct ip6_frag)) {
   1378    1.2    itojun 		/* use the trailing space of the last mbuf for the fragment hdr */
   1379  1.117  christos 		*frghdrp = (struct ip6_frag *)(mtod(mlast, char *) +
   1380   1.49    itojun 		    mlast->m_len);
   1381    1.2    itojun 		mlast->m_len += sizeof(struct ip6_frag);
   1382    1.2    itojun 		m->m_pkthdr.len += sizeof(struct ip6_frag);
   1383   1.19    itojun 	} else {
   1384    1.2    itojun 		/* allocate a new mbuf for the fragment header */
   1385    1.2    itojun 		struct mbuf *mfrg;
   1386    1.2    itojun 
   1387    1.2    itojun 		MGET(mfrg, M_DONTWAIT, MT_DATA);
   1388    1.2    itojun 		if (mfrg == 0)
   1389   1.57    itojun 			return (ENOBUFS);
   1390    1.2    itojun 		mfrg->m_len = sizeof(struct ip6_frag);
   1391    1.2    itojun 		*frghdrp = mtod(mfrg, struct ip6_frag *);
   1392    1.2    itojun 		mlast->m_next = mfrg;
                         		/*
                         		 * NOTE(review): unlike the branch above, m->m_pkthdr.len is
                         		 * not adjusted here; presumably the caller sets the packet
                         		 * length itself -- confirm against the call site.
                         		 */
   1393    1.2    itojun 	}
   1394    1.2    itojun 
   1395   1.57    itojun 	return (0);
   1396   1.45    itojun }
   1397   1.45    itojun 
                         /*
                          * Work out the MTU to use for packets sent to dst.
                          *
                          * ro_pmtu:     route cache consulted for the MTU.  When it is not the
                          *              same object as ro, it is looked up for dst first.
                          * ro:          route cache used for the first hop; only compared
                          *              against ro_pmtu here.
                          * ifp:         outgoing interface; may be NULL, in which case the
                          *              interface of the route found in ro_pmtu is used.
                          * dst:         final destination address.
                          * mtup:        receives the resulting MTU (0 when no route and no
                          *              interface are available).
                          * alwaysfragp: optional (may be NULL); set to 1 when the route's MTU
                          *              is below IPV6_MMTU, otherwise 0.
                          *
                          * With a route, the route's rmx_mtu is used, except that 0 falls back
                          * to the link MTU, values below IPV6_MMTU are raised to IPV6_MMTU, and
                          * values above the link MTU are clamped to it.  Without a route the
                          * link MTU of ifp is used.
                          *
                          * Returns 0, or EHOSTUNREACH when there is neither a route nor an
                          * interface.
                          */
   1398   1.88    itojun static int
   1399  1.118    dyoung ip6_getpmtu(struct route *ro_pmtu, struct route *ro, struct ifnet *ifp,
   1400  1.115    dyoung     const struct in6_addr *dst, u_long *mtup, int *alwaysfragp)
   1401   1.45    itojun {
   1402  1.124    dyoung 	struct rtentry *rt;
   1403   1.45    itojun 	u_int32_t mtu = 0;
   1404   1.78    itojun 	int alwaysfrag = 0;
   1405   1.45    itojun 	int error = 0;
   1406   1.45    itojun 
   1407   1.45    itojun 	if (ro_pmtu != ro) {
   1408  1.118    dyoung 		union {
   1409  1.118    dyoung 			struct sockaddr		dst;
   1410  1.118    dyoung 			struct sockaddr_in6	dst6;
   1411  1.118    dyoung 		} u;
   1412  1.118    dyoung 
   1413   1.45    itojun 		/* The first hop and the final destination may differ. */
   1414  1.118    dyoung 		sockaddr_in6_init(&u.dst6, dst, 0, 0, 0);
   1415  1.118    dyoung 		rtcache_lookup(ro_pmtu, &u.dst);
   1416   1.45    itojun 	}
   1417  1.124    dyoung 	if ((rt = rtcache_getrt(ro_pmtu)) != NULL) {
   1418   1.45    itojun 		u_int32_t ifmtu;
   1419   1.45    itojun 
   1420   1.45    itojun 		if (ifp == NULL)
   1421  1.124    dyoung 			ifp = rt->rt_ifp;
   1422   1.45    itojun 		ifmtu = IN6_LINKMTU(ifp);
   1423  1.124    dyoung 		mtu = rt->rt_rmx.rmx_mtu;
                         		/* A route MTU of 0 falls back to the link MTU. */
   1424   1.46    itojun 		if (mtu == 0)
   1425   1.46    itojun 			mtu = ifmtu;
   1426   1.78    itojun 		else if (mtu < IPV6_MMTU) {
   1427   1.78    itojun 			/*
   1428   1.78    itojun 			 * RFC2460 section 5, last paragraph:
   1429   1.78    itojun 			 * if we record ICMPv6 too big message with
   1430   1.78    itojun 			 * mtu < IPV6_MMTU, transmit packets sized IPV6_MMTU
   1431   1.78    itojun 			 * or smaller, with fragment header attached.
   1432   1.78    itojun 			 * (fragment header is needed regardless of the
   1433   1.78    itojun 			 * packet size, for translators to identify packets)
   1434   1.78    itojun 			 */
   1435   1.78    itojun 			alwaysfrag = 1;
   1436   1.78    itojun 			mtu = IPV6_MMTU;
   1437   1.78    itojun 		} else if (mtu > ifmtu) {
   1438   1.45    itojun 			/*
   1439   1.45    itojun 			 * The MTU on the route is larger than the MTU on
   1440   1.45    itojun 			 * the interface!  This shouldn't happen, unless the
   1441   1.45    itojun 			 * MTU of the interface has been changed after the
   1442   1.45    itojun 			 * interface was brought up.  Change the MTU in the
   1443   1.45    itojun 			 * route to match the interface MTU (as long as the
   1444   1.45    itojun 			 * field isn't locked).
   1445   1.45    itojun 			 */
   1446   1.45    itojun 			mtu = ifmtu;
   1447  1.124    dyoung 			if (!(rt->rt_rmx.rmx_locks & RTV_MTU))
   1448  1.124    dyoung 				rt->rt_rmx.rmx_mtu = mtu;
   1449   1.45    itojun 		}
   1450   1.45    itojun 	} else if (ifp) {
                         		/* No route: use the link MTU of the given interface. */
   1451   1.45    itojun 		mtu = IN6_LINKMTU(ifp);
   1452   1.45    itojun 	} else
   1453   1.45    itojun 		error = EHOSTUNREACH; /* XXX */
   1454   1.45    itojun 
                         	/* *mtup is written on the error path too (it is then 0). */
   1455   1.45    itojun 	*mtup = mtu;
   1456   1.78    itojun 	if (alwaysfragp)
   1457   1.78    itojun 		*alwaysfragp = alwaysfrag;
   1458   1.57    itojun 	return (error);
   1459    1.2    itojun }
   1460    1.2    itojun 
   1461    1.2    itojun /*
   1462    1.2    itojun  * IP6 socket option processing.
   1463    1.2    itojun  */
   1464    1.2    itojun int
   1465  1.115    dyoung ip6_ctloutput(int op, struct socket *so, int level, int optname,
   1466  1.115    dyoung     struct mbuf **mp)
   1467    1.2    itojun {
   1468   1.97    rpaulo 	int privileged, optdatalen, uproto;
   1469   1.97    rpaulo 	void *optdata;
   1470   1.31    itojun 	struct in6pcb *in6p = sotoin6pcb(so);
   1471   1.31    itojun 	struct mbuf *m = *mp;
   1472   1.97    rpaulo 	int error, optval;
   1473   1.97    rpaulo 	int optlen;
   1474  1.101        ad 	struct lwp *l = curlwp;	/* XXX */
   1475    1.2    itojun 
   1476   1.97    rpaulo 	optlen = m ? m->m_len : 0;
   1477   1.97    rpaulo 	error = optval = 0;
   1478  1.101        ad 	privileged = (l == 0 || kauth_authorize_generic(l->l_cred,
   1479  1.111      elad 	    KAUTH_GENERIC_ISSUSER, NULL)) ? 0 : 1;
   1480   1.97    rpaulo 	uproto = (int)so->so_proto->pr_protocol;
   1481   1.97    rpaulo 
   1482  1.121    dyoung 	if (level != IPPROTO_IPV6) {
   1483  1.121    dyoung 		if (op == PRCO_SETOPT && *mp)
   1484  1.121    dyoung 			(void)m_free(*mp);
   1485  1.121    dyoung 		return ENOPROTOOPT;
   1486  1.121    dyoung 	}
   1487  1.121    dyoung 	switch (op) {
   1488  1.121    dyoung 	case PRCO_SETOPT:
   1489  1.121    dyoung 		switch (optname) {
   1490   1.97    rpaulo #ifdef RFC2292
   1491  1.121    dyoung 		case IPV6_2292PKTOPTIONS:
   1492  1.121    dyoung 			/* m is freed in ip6_pcbopts */
   1493  1.121    dyoung 			error = ip6_pcbopts(&in6p->in6p_outputopts,
   1494  1.121    dyoung 			    m, so);
   1495  1.121    dyoung 			break;
   1496  1.121    dyoung #endif
   1497  1.121    dyoung 
   1498  1.121    dyoung 		/*
   1499  1.121    dyoung 		 * Use of some Hop-by-Hop options or some
   1500  1.121    dyoung 		 * Destination options, might require special
   1501  1.121    dyoung 		 * privilege.  That is, normal applications
   1502  1.121    dyoung 		 * (without special privilege) might be forbidden
   1503  1.121    dyoung 		 * from setting certain options in outgoing packets,
   1504  1.121    dyoung 		 * and might never see certain options in received
   1505  1.121    dyoung 		 * packets. [RFC 2292 Section 6]
   1506  1.121    dyoung 		 * KAME specific note:
   1507  1.121    dyoung 		 *  KAME prevents non-privileged users from sending or
   1508  1.121    dyoung 		 *  receiving ANY hbh/dst options in order to avoid
   1509  1.121    dyoung 		 *  overhead of parsing options in the kernel.
   1510  1.121    dyoung 		 */
   1511  1.121    dyoung 		case IPV6_RECVHOPOPTS:
   1512  1.121    dyoung 		case IPV6_RECVDSTOPTS:
   1513  1.121    dyoung 		case IPV6_RECVRTHDRDSTOPTS:
   1514  1.121    dyoung 			if (!privileged) {
   1515  1.121    dyoung 				error = EPERM;
   1516  1.121    dyoung 				break;
   1517  1.121    dyoung 			}
   1518  1.121    dyoung 			/* FALLTHROUGH */
   1519  1.121    dyoung 		case IPV6_UNICAST_HOPS:
   1520  1.121    dyoung 		case IPV6_HOPLIMIT:
   1521  1.121    dyoung 		case IPV6_FAITH:
   1522  1.121    dyoung 
   1523  1.121    dyoung 		case IPV6_RECVPKTINFO:
   1524  1.121    dyoung 		case IPV6_RECVHOPLIMIT:
   1525  1.121    dyoung 		case IPV6_RECVRTHDR:
   1526  1.121    dyoung 		case IPV6_RECVPATHMTU:
   1527  1.121    dyoung 		case IPV6_RECVTCLASS:
   1528  1.121    dyoung 		case IPV6_V6ONLY:
   1529  1.121    dyoung 			if (optlen != sizeof(int)) {
   1530  1.121    dyoung 				error = EINVAL;
   1531   1.97    rpaulo 				break;
   1532  1.121    dyoung 			}
   1533  1.121    dyoung 			optval = *mtod(m, int *);
   1534  1.121    dyoung 			switch (optname) {
   1535   1.97    rpaulo 
   1536    1.2    itojun 			case IPV6_UNICAST_HOPS:
   1537  1.121    dyoung 				if (optval < -1 || optval >= 256)
   1538    1.2    itojun 					error = EINVAL;
   1539  1.121    dyoung 				else {
   1540  1.121    dyoung 					/* -1 = kernel default */
   1541  1.121    dyoung 					in6p->in6p_hops = optval;
   1542   1.37    itojun 				}
   1543  1.121    dyoung 				break;
   1544    1.2    itojun #define OPTSET(bit) \
   1545   1.49    itojun do { \
   1546  1.121    dyoung if (optval) \
   1547  1.121    dyoung 	in6p->in6p_flags |= (bit); \
   1548  1.121    dyoung else \
   1549  1.121    dyoung 	in6p->in6p_flags &= ~(bit); \
   1550   1.60     perry } while (/*CONSTCOND*/ 0)
   1551    1.2    itojun 
   1552   1.97    rpaulo #ifdef RFC2292
   1553   1.97    rpaulo #define OPTSET2292(bit) 			\
   1554   1.97    rpaulo do { 						\
   1555  1.121    dyoung in6p->in6p_flags |= IN6P_RFC2292; 	\
   1556  1.121    dyoung if (optval) 				\
   1557  1.121    dyoung 	in6p->in6p_flags |= (bit); 	\
   1558  1.121    dyoung else 					\
   1559  1.121    dyoung 	in6p->in6p_flags &= ~(bit); 	\
   1560   1.97    rpaulo } while (/*CONSTCOND*/ 0)
   1561   1.97    rpaulo #endif
   1562   1.97    rpaulo 
   1563   1.97    rpaulo #define OPTBIT(bit) (in6p->in6p_flags & (bit) ? 1 : 0)
   1564    1.2    itojun 
   1565  1.121    dyoung 			case IPV6_RECVPKTINFO:
   1566   1.97    rpaulo #ifdef RFC2292
   1567  1.121    dyoung 				/* cannot mix with RFC2292 */
   1568  1.121    dyoung 				if (OPTBIT(IN6P_RFC2292)) {
   1569  1.121    dyoung 					error = EINVAL;
   1570  1.121    dyoung 					break;
   1571  1.121    dyoung 				}
   1572   1.97    rpaulo #endif
   1573  1.121    dyoung 				OPTSET(IN6P_PKTINFO);
   1574  1.121    dyoung 				break;
   1575  1.121    dyoung 
   1576  1.121    dyoung 			case IPV6_HOPLIMIT:
   1577  1.121    dyoung 			{
   1578  1.121    dyoung 				struct ip6_pktopts **optp;
   1579    1.2    itojun 
   1580  1.121    dyoung #ifdef RFC2292
   1581  1.121    dyoung 				/* cannot mix with RFC2292 */
   1582  1.121    dyoung 				if (OPTBIT(IN6P_RFC2292)) {
   1583  1.121    dyoung 					error = EINVAL;
   1584   1.37    itojun 					break;
   1585   1.97    rpaulo 				}
   1586  1.121    dyoung #endif
   1587  1.121    dyoung 				optp = &in6p->in6p_outputopts;
   1588  1.121    dyoung 				error = ip6_pcbopt(IPV6_HOPLIMIT,
   1589  1.121    dyoung 						   (u_char *)&optval,
   1590  1.121    dyoung 						   sizeof(optval),
   1591  1.121    dyoung 						   optp,
   1592  1.121    dyoung 						   privileged, uproto);
   1593  1.121    dyoung 				break;
   1594  1.121    dyoung 			}
   1595    1.2    itojun 
   1596  1.121    dyoung 			case IPV6_RECVHOPLIMIT:
   1597   1.97    rpaulo #ifdef RFC2292
   1598  1.121    dyoung 				/* cannot mix with RFC2292 */
   1599  1.121    dyoung 				if (OPTBIT(IN6P_RFC2292)) {
   1600  1.121    dyoung 					error = EINVAL;
   1601  1.121    dyoung 					break;
   1602  1.121    dyoung 				}
   1603   1.97    rpaulo #endif
   1604  1.121    dyoung 				OPTSET(IN6P_HOPLIMIT);
   1605  1.121    dyoung 				break;
   1606    1.2    itojun 
   1607  1.121    dyoung 			case IPV6_RECVHOPOPTS:
   1608   1.97    rpaulo #ifdef RFC2292
   1609  1.121    dyoung 				/* cannot mix with RFC2292 */
   1610  1.121    dyoung 				if (OPTBIT(IN6P_RFC2292)) {
   1611  1.121    dyoung 					error = EINVAL;
   1612  1.121    dyoung 					break;
   1613  1.121    dyoung 				}
   1614   1.97    rpaulo #endif
   1615  1.121    dyoung 				OPTSET(IN6P_HOPOPTS);
   1616  1.121    dyoung 				break;
   1617    1.2    itojun 
   1618  1.121    dyoung 			case IPV6_RECVDSTOPTS:
   1619   1.97    rpaulo #ifdef RFC2292
   1620  1.121    dyoung 				/* cannot mix with RFC2292 */
   1621  1.121    dyoung 				if (OPTBIT(IN6P_RFC2292)) {
   1622  1.121    dyoung 					error = EINVAL;
   1623  1.121    dyoung 					break;
   1624  1.121    dyoung 				}
   1625   1.97    rpaulo #endif
   1626  1.121    dyoung 				OPTSET(IN6P_DSTOPTS);
   1627  1.121    dyoung 				break;
   1628    1.2    itojun 
   1629  1.121    dyoung 			case IPV6_RECVRTHDRDSTOPTS:
   1630   1.97    rpaulo #ifdef RFC2292
   1631  1.121    dyoung 				/* cannot mix with RFC2292 */
   1632  1.121    dyoung 				if (OPTBIT(IN6P_RFC2292)) {
   1633  1.121    dyoung 					error = EINVAL;
   1634  1.121    dyoung 					break;
   1635  1.121    dyoung 				}
   1636   1.97    rpaulo #endif
   1637  1.121    dyoung 				OPTSET(IN6P_RTHDRDSTOPTS);
   1638  1.121    dyoung 				break;
   1639   1.97    rpaulo 
   1640  1.121    dyoung 			case IPV6_RECVRTHDR:
   1641   1.97    rpaulo #ifdef RFC2292
   1642  1.121    dyoung 				/* cannot mix with RFC2292 */
   1643  1.121    dyoung 				if (OPTBIT(IN6P_RFC2292)) {
   1644  1.121    dyoung 					error = EINVAL;
   1645  1.121    dyoung 					break;
   1646  1.121    dyoung 				}
   1647   1.97    rpaulo #endif
   1648  1.121    dyoung 				OPTSET(IN6P_RTHDR);
   1649  1.121    dyoung 				break;
   1650  1.121    dyoung 
   1651  1.121    dyoung 			case IPV6_FAITH:
   1652  1.121    dyoung 				OPTSET(IN6P_FAITH);
   1653  1.121    dyoung 				break;
   1654    1.2    itojun 
   1655  1.121    dyoung 			case IPV6_RECVPATHMTU:
   1656  1.121    dyoung 				/*
   1657  1.121    dyoung 				 * We ignore this option for TCP
   1658  1.121    dyoung 				 * sockets.
   1659  1.121    dyoung 				 * (RFC3542 leaves this case
   1660  1.121    dyoung 				 * unspecified.)
   1661  1.121    dyoung 				 */
   1662  1.121    dyoung 				if (uproto != IPPROTO_TCP)
   1663  1.121    dyoung 					OPTSET(IN6P_MTU);
   1664  1.121    dyoung 				break;
   1665   1.10    itojun 
   1666  1.121    dyoung 			case IPV6_V6ONLY:
   1667  1.121    dyoung 				/*
   1668  1.121    dyoung 				 * make setsockopt(IPV6_V6ONLY)
   1669  1.121    dyoung 				 * available only prior to bind(2).
   1670  1.121    dyoung 				 * see ipng mailing list, Jun 22 2001.
   1671  1.121    dyoung 				 */
   1672  1.121    dyoung 				if (in6p->in6p_lport ||
   1673  1.121    dyoung 				    !IN6_IS_ADDR_UNSPECIFIED(&in6p->in6p_laddr)) {
   1674  1.121    dyoung 					error = EINVAL;
   1675   1.83    itojun 					break;
   1676  1.121    dyoung 				}
   1677   1.37    itojun #ifdef INET6_BINDV6ONLY
   1678  1.121    dyoung 				if (!optval)
   1679  1.121    dyoung 					error = EINVAL;
   1680   1.37    itojun #else
   1681  1.121    dyoung 				OPTSET(IN6P_IPV6_V6ONLY);
   1682   1.10    itojun #endif
   1683  1.121    dyoung 				break;
   1684  1.121    dyoung 			case IPV6_RECVTCLASS:
   1685  1.121    dyoung #ifdef RFC2292
   1686  1.121    dyoung 				/* cannot mix with RFC2292 XXX */
   1687  1.121    dyoung 				if (OPTBIT(IN6P_RFC2292)) {
   1688  1.121    dyoung 					error = EINVAL;
   1689   1.37    itojun 					break;
   1690  1.121    dyoung 				}
   1691   1.97    rpaulo #endif
   1692  1.121    dyoung 				OPTSET(IN6P_TCLASS);
   1693  1.121    dyoung 				break;
   1694  1.121    dyoung 
   1695  1.121    dyoung 			}
   1696  1.121    dyoung 			break;
   1697  1.121    dyoung 
   1698  1.121    dyoung 		case IPV6_OTCLASS:
   1699  1.121    dyoung 		{
   1700  1.121    dyoung 			struct ip6_pktopts **optp;
   1701  1.121    dyoung 			u_int8_t tclass;
   1702   1.97    rpaulo 
   1703  1.121    dyoung 			if (optlen != sizeof(tclass)) {
   1704  1.121    dyoung 				error = EINVAL;
   1705   1.97    rpaulo 				break;
   1706  1.121    dyoung 			}
   1707  1.121    dyoung 			tclass = *mtod(m, u_int8_t *);
   1708  1.121    dyoung 			optp = &in6p->in6p_outputopts;
   1709  1.121    dyoung 			error = ip6_pcbopt(optname,
   1710  1.121    dyoung 					   (u_char *)&tclass,
   1711  1.121    dyoung 					   sizeof(tclass),
   1712  1.121    dyoung 					   optp,
   1713  1.121    dyoung 					   privileged, uproto);
   1714  1.121    dyoung 			break;
   1715  1.121    dyoung 		}
   1716   1.97    rpaulo 
   1717  1.121    dyoung 		case IPV6_TCLASS:
   1718  1.121    dyoung 		case IPV6_DONTFRAG:
   1719  1.121    dyoung 		case IPV6_USE_MIN_MTU:
   1720  1.121    dyoung 			if (optlen != sizeof(optval)) {
   1721  1.121    dyoung 				error = EINVAL;
   1722  1.121    dyoung 				break;
   1723  1.121    dyoung 			}
   1724  1.121    dyoung 			optval = *mtod(m, int *);
   1725   1.97    rpaulo 			{
   1726   1.97    rpaulo 				struct ip6_pktopts **optp;
   1727   1.97    rpaulo 				optp = &in6p->in6p_outputopts;
   1728   1.97    rpaulo 				error = ip6_pcbopt(optname,
   1729  1.121    dyoung 						   (u_char *)&optval,
   1730  1.121    dyoung 						   sizeof(optval),
   1731   1.97    rpaulo 						   optp,
   1732   1.97    rpaulo 						   privileged, uproto);
   1733   1.97    rpaulo 				break;
   1734   1.97    rpaulo 			}
   1735   1.97    rpaulo 
   1736   1.97    rpaulo #ifdef RFC2292
   1737  1.121    dyoung 		case IPV6_2292PKTINFO:
   1738  1.121    dyoung 		case IPV6_2292HOPLIMIT:
   1739  1.121    dyoung 		case IPV6_2292HOPOPTS:
   1740  1.121    dyoung 		case IPV6_2292DSTOPTS:
   1741  1.121    dyoung 		case IPV6_2292RTHDR:
   1742  1.121    dyoung 			/* RFC 2292 */
   1743  1.121    dyoung 			if (optlen != sizeof(int)) {
   1744  1.121    dyoung 				error = EINVAL;
   1745  1.121    dyoung 				break;
   1746  1.121    dyoung 			}
   1747  1.121    dyoung 			optval = *mtod(m, int *);
   1748  1.121    dyoung 			switch (optname) {
   1749   1.97    rpaulo 			case IPV6_2292PKTINFO:
   1750  1.121    dyoung 				OPTSET2292(IN6P_PKTINFO);
   1751  1.121    dyoung 				break;
   1752   1.97    rpaulo 			case IPV6_2292HOPLIMIT:
   1753  1.121    dyoung 				OPTSET2292(IN6P_HOPLIMIT);
   1754  1.121    dyoung 				break;
   1755   1.97    rpaulo 			case IPV6_2292HOPOPTS:
   1756  1.121    dyoung 				/*
   1757  1.121    dyoung 				 * Check super-user privilege.
   1758  1.121    dyoung 				 * See comments for IPV6_RECVHOPOPTS.
   1759  1.121    dyoung 				 */
   1760  1.121    dyoung 				if (!privileged)
   1761  1.121    dyoung 					return (EPERM);
   1762  1.121    dyoung 				OPTSET2292(IN6P_HOPOPTS);
   1763  1.121    dyoung 				break;
   1764   1.97    rpaulo 			case IPV6_2292DSTOPTS:
   1765  1.121    dyoung 				if (!privileged)
   1766  1.121    dyoung 					return (EPERM);
   1767  1.121    dyoung 				OPTSET2292(IN6P_DSTOPTS|IN6P_RTHDRDSTOPTS); /* XXX */
   1768  1.121    dyoung 				break;
   1769   1.97    rpaulo 			case IPV6_2292RTHDR:
   1770  1.121    dyoung 				OPTSET2292(IN6P_RTHDR);
   1771   1.97    rpaulo 				break;
   1772  1.121    dyoung 			}
   1773  1.121    dyoung 			break;
   1774   1.97    rpaulo #endif
   1775  1.121    dyoung 		case IPV6_PKTINFO:
   1776  1.121    dyoung 		case IPV6_HOPOPTS:
   1777  1.121    dyoung 		case IPV6_RTHDR:
   1778  1.121    dyoung 		case IPV6_DSTOPTS:
   1779  1.121    dyoung 		case IPV6_RTHDRDSTOPTS:
   1780  1.121    dyoung 		case IPV6_NEXTHOP:
   1781  1.121    dyoung 		{
   1782  1.121    dyoung 			/* new advanced API (RFC3542) */
   1783  1.121    dyoung 			u_char *optbuf;
   1784  1.121    dyoung 			int optbuflen;
   1785  1.121    dyoung 			struct ip6_pktopts **optp;
   1786  1.121    dyoung 			if (!m) {
   1787  1.121    dyoung 				error = EINVAL;
   1788  1.121    dyoung 				break;
   1789  1.121    dyoung 			}
   1790   1.97    rpaulo 
   1791   1.97    rpaulo #ifdef RFC2292
   1792  1.121    dyoung 			/* cannot mix with RFC2292 */
   1793  1.121    dyoung 			if (OPTBIT(IN6P_RFC2292)) {
   1794  1.121    dyoung 				error = EINVAL;
   1795  1.121    dyoung 				break;
   1796  1.121    dyoung 			}
   1797   1.97    rpaulo #endif
   1798   1.97    rpaulo 
   1799  1.121    dyoung 			if (m && m->m_next) {
   1800  1.121    dyoung 				error = EINVAL;	/* XXX */
   1801    1.2    itojun 				break;
   1802   1.97    rpaulo 			}
   1803  1.121    dyoung 
   1804  1.121    dyoung 			optbuf = mtod(m, u_char *);
   1805  1.121    dyoung 			optbuflen = m->m_len;
   1806  1.121    dyoung 			optp = &in6p->in6p_outputopts;
   1807  1.121    dyoung 			error = ip6_pcbopt(optname, optbuf, optbuflen,
   1808  1.121    dyoung 			    optp, privileged, uproto);
   1809  1.121    dyoung 			break;
   1810  1.121    dyoung 		}
   1811    1.2    itojun #undef OPTSET
   1812    1.2    itojun 
   1813  1.121    dyoung 		case IPV6_MULTICAST_IF:
   1814  1.121    dyoung 		case IPV6_MULTICAST_HOPS:
   1815  1.121    dyoung 		case IPV6_MULTICAST_LOOP:
   1816  1.121    dyoung 		case IPV6_JOIN_GROUP:
   1817  1.121    dyoung 		case IPV6_LEAVE_GROUP:
   1818  1.121    dyoung 			error = ip6_setmoptions(optname,
   1819  1.121    dyoung 			    &in6p->in6p_moptions, m);
   1820  1.121    dyoung 			break;
   1821  1.121    dyoung 
   1822  1.121    dyoung 		case IPV6_PORTRANGE:
   1823  1.121    dyoung 			if (!m) {
   1824  1.121    dyoung 				error = EINVAL;
   1825    1.2    itojun 				break;
   1826  1.121    dyoung 			}
   1827  1.121    dyoung 			optval = *mtod(m, int *);
   1828    1.2    itojun 
   1829  1.121    dyoung 			switch (optval) {
   1830  1.121    dyoung 			case IPV6_PORTRANGE_DEFAULT:
   1831  1.121    dyoung 				in6p->in6p_flags &= ~(IN6P_LOWPORT);
   1832  1.121    dyoung 				in6p->in6p_flags &= ~(IN6P_HIGHPORT);
   1833  1.121    dyoung 				break;
   1834   1.12    itojun 
   1835  1.121    dyoung 			case IPV6_PORTRANGE_HIGH:
   1836  1.121    dyoung 				in6p->in6p_flags &= ~(IN6P_LOWPORT);
   1837  1.121    dyoung 				in6p->in6p_flags |= IN6P_HIGHPORT;
   1838  1.121    dyoung 				break;
   1839   1.12    itojun 
   1840  1.121    dyoung 			case IPV6_PORTRANGE_LOW:
   1841  1.121    dyoung 				in6p->in6p_flags &= ~(IN6P_HIGHPORT);
   1842  1.121    dyoung 				in6p->in6p_flags |= IN6P_LOWPORT;
   1843  1.121    dyoung 				break;
   1844   1.12    itojun 
   1845  1.121    dyoung 			default:
   1846  1.121    dyoung 				error = EINVAL;
   1847   1.12    itojun 				break;
   1848  1.121    dyoung 			}
   1849  1.121    dyoung 			break;
   1850   1.12    itojun 
   1851  1.114  degroote 
   1852  1.114  degroote #if defined(IPSEC) || defined(FAST_IPSEC)
   1853  1.121    dyoung 		case IPV6_IPSEC_POLICY:
   1854  1.121    dyoung 		{
   1855  1.121    dyoung 			void *req = NULL;
   1856  1.121    dyoung 			size_t len = 0;
   1857  1.121    dyoung 			if (m) {
   1858  1.121    dyoung 				req = mtod(m, void *);
   1859  1.121    dyoung 				len = m->m_len;
   1860   1.97    rpaulo 			}
   1861  1.121    dyoung 			error = ipsec6_set_policy(in6p, optname, req,
   1862  1.121    dyoung 						  len, privileged);
   1863  1.121    dyoung 		}
   1864  1.121    dyoung 			break;
   1865    1.2    itojun #endif /* IPSEC */
   1866    1.2    itojun 
   1867  1.121    dyoung 		default:
   1868  1.121    dyoung 			error = ENOPROTOOPT;
   1869    1.2    itojun 			break;
   1870  1.121    dyoung 		}
   1871  1.121    dyoung 		if (m)
   1872  1.121    dyoung 			(void)m_free(m);
   1873  1.121    dyoung 		break;
   1874    1.2    itojun 
   1875  1.121    dyoung 	case PRCO_GETOPT:
   1876  1.121    dyoung 		switch (optname) {
   1877   1.97    rpaulo #ifdef RFC2292
   1878  1.121    dyoung 		case IPV6_2292PKTOPTIONS:
   1879  1.121    dyoung 			/*
   1880  1.121    dyoung 			 * RFC3542 (effectively) deprecated the
   1881  1.121    dyoung 			 * semantics of the 2292-style pktoptions.
   1882  1.121    dyoung 			 * Since it was not reliable in nature (i.e.,
   1883  1.121    dyoung 			 * applications had to expect the lack of some
   1884  1.121    dyoung 			 * information after all), it would make sense
   1885  1.121    dyoung 			 * to simplify this part by always returning
   1886  1.121    dyoung 			 * empty data.
   1887  1.121    dyoung 			 */
   1888  1.121    dyoung 			*mp = m_get(M_WAIT, MT_SOOPTS);
   1889  1.121    dyoung 			(*mp)->m_len = 0;
   1890  1.121    dyoung 			break;
   1891   1.97    rpaulo #endif
   1892    1.2    itojun 
   1893  1.121    dyoung 		case IPV6_RECVHOPOPTS:
   1894  1.121    dyoung 		case IPV6_RECVDSTOPTS:
   1895  1.121    dyoung 		case IPV6_RECVRTHDRDSTOPTS:
   1896  1.121    dyoung 		case IPV6_UNICAST_HOPS:
   1897  1.121    dyoung 		case IPV6_RECVPKTINFO:
   1898  1.121    dyoung 		case IPV6_RECVHOPLIMIT:
   1899  1.121    dyoung 		case IPV6_RECVRTHDR:
   1900  1.121    dyoung 		case IPV6_RECVPATHMTU:
   1901  1.121    dyoung 
   1902  1.121    dyoung 		case IPV6_FAITH:
   1903  1.121    dyoung 		case IPV6_V6ONLY:
   1904  1.121    dyoung 		case IPV6_PORTRANGE:
   1905  1.121    dyoung 		case IPV6_RECVTCLASS:
   1906  1.121    dyoung 			switch (optname) {
   1907  1.121    dyoung 
   1908   1.97    rpaulo 			case IPV6_RECVHOPOPTS:
   1909  1.121    dyoung 				optval = OPTBIT(IN6P_HOPOPTS);
   1910  1.121    dyoung 				break;
   1911  1.121    dyoung 
   1912   1.97    rpaulo 			case IPV6_RECVDSTOPTS:
   1913  1.121    dyoung 				optval = OPTBIT(IN6P_DSTOPTS);
   1914  1.121    dyoung 				break;
   1915  1.121    dyoung 
   1916   1.97    rpaulo 			case IPV6_RECVRTHDRDSTOPTS:
   1917  1.121    dyoung 				optval = OPTBIT(IN6P_RTHDRDSTOPTS);
   1918  1.121    dyoung 				break;
   1919  1.121    dyoung 
   1920   1.97    rpaulo 			case IPV6_UNICAST_HOPS:
   1921  1.121    dyoung 				optval = in6p->in6p_hops;
   1922  1.121    dyoung 				break;
   1923  1.121    dyoung 
   1924   1.97    rpaulo 			case IPV6_RECVPKTINFO:
   1925  1.121    dyoung 				optval = OPTBIT(IN6P_PKTINFO);
   1926  1.121    dyoung 				break;
   1927  1.121    dyoung 
   1928   1.97    rpaulo 			case IPV6_RECVHOPLIMIT:
   1929  1.121    dyoung 				optval = OPTBIT(IN6P_HOPLIMIT);
   1930  1.121    dyoung 				break;
   1931  1.121    dyoung 
   1932   1.97    rpaulo 			case IPV6_RECVRTHDR:
   1933  1.121    dyoung 				optval = OPTBIT(IN6P_RTHDR);
   1934  1.121    dyoung 				break;
   1935  1.121    dyoung 
   1936   1.97    rpaulo 			case IPV6_RECVPATHMTU:
   1937  1.121    dyoung 				optval = OPTBIT(IN6P_MTU);
   1938  1.121    dyoung 				break;
   1939    1.2    itojun 
   1940    1.2    itojun 			case IPV6_FAITH:
   1941  1.121    dyoung 				optval = OPTBIT(IN6P_FAITH);
   1942  1.121    dyoung 				break;
   1943  1.121    dyoung 
   1944   1.37    itojun 			case IPV6_V6ONLY:
   1945  1.121    dyoung 				optval = OPTBIT(IN6P_IPV6_V6ONLY);
   1946  1.121    dyoung 				break;
   1947  1.121    dyoung 
   1948   1.97    rpaulo 			case IPV6_PORTRANGE:
   1949  1.121    dyoung 			    {
   1950  1.121    dyoung 				int flags;
   1951  1.121    dyoung 				flags = in6p->in6p_flags;
   1952  1.121    dyoung 				if (flags & IN6P_HIGHPORT)
   1953  1.121    dyoung 					optval = IPV6_PORTRANGE_HIGH;
   1954  1.121    dyoung 				else if (flags & IN6P_LOWPORT)
   1955  1.121    dyoung 					optval = IPV6_PORTRANGE_LOW;
   1956  1.121    dyoung 				else
   1957  1.121    dyoung 					optval = 0;
   1958  1.121    dyoung 				break;
   1959  1.121    dyoung 			    }
   1960   1.97    rpaulo 			case IPV6_RECVTCLASS:
   1961  1.121    dyoung 				optval = OPTBIT(IN6P_TCLASS);
   1962  1.121    dyoung 				break;
   1963    1.2    itojun 
   1964  1.121    dyoung 			}
   1965  1.121    dyoung 			if (error)
   1966   1.97    rpaulo 				break;
   1967  1.121    dyoung 			*mp = m = m_get(M_WAIT, MT_SOOPTS);
   1968  1.121    dyoung 			m->m_len = sizeof(int);
   1969  1.121    dyoung 			*mtod(m, int *) = optval;
   1970  1.121    dyoung 			break;
   1971   1.97    rpaulo 
   1972  1.121    dyoung 		case IPV6_PATHMTU:
   1973  1.121    dyoung 		    {
   1974  1.121    dyoung 			u_long pmtu = 0;
   1975  1.121    dyoung 			struct ip6_mtuinfo mtuinfo;
   1976  1.121    dyoung 			struct route *ro = &in6p->in6p_route;
   1977    1.2    itojun 
   1978  1.121    dyoung 			if (!(so->so_state & SS_ISCONNECTED))
   1979  1.121    dyoung 				return (ENOTCONN);
   1980  1.121    dyoung 			/*
   1981  1.121    dyoung 			 * XXX: we do not consider the case of source
   1982  1.121    dyoung 			 * routing, or optional information to specify
   1983  1.121    dyoung 			 * the outgoing interface.
   1984  1.121    dyoung 			 */
   1985  1.121    dyoung 			error = ip6_getpmtu(ro, NULL, NULL,
   1986  1.121    dyoung 			    &in6p->in6p_faddr, &pmtu, NULL);
   1987  1.121    dyoung 			if (error)
   1988  1.121    dyoung 				break;
   1989  1.121    dyoung 			if (pmtu > IPV6_MAXPACKET)
   1990  1.121    dyoung 				pmtu = IPV6_MAXPACKET;
   1991  1.121    dyoung 
   1992  1.121    dyoung 			memset(&mtuinfo, 0, sizeof(mtuinfo));
   1993  1.121    dyoung 			mtuinfo.ip6m_mtu = (u_int32_t)pmtu;
   1994  1.121    dyoung 			optdata = (void *)&mtuinfo;
   1995  1.121    dyoung 			optdatalen = sizeof(mtuinfo);
   1996  1.121    dyoung 			if (optdatalen > MCLBYTES)
   1997  1.121    dyoung 				return (EMSGSIZE); /* XXX */
   1998  1.121    dyoung 			*mp = m = m_get(M_WAIT, MT_SOOPTS);
   1999  1.121    dyoung 			if (optdatalen > MLEN)
   2000  1.121    dyoung 				MCLGET(m, M_WAIT);
   2001  1.121    dyoung 			m->m_len = optdatalen;
   2002  1.121    dyoung 			memcpy(mtod(m, void *), optdata, optdatalen);
   2003  1.121    dyoung 			break;
   2004  1.121    dyoung 		    }
   2005   1.97    rpaulo 
   2006   1.97    rpaulo #ifdef RFC2292
   2007  1.121    dyoung 		case IPV6_2292PKTINFO:
   2008  1.121    dyoung 		case IPV6_2292HOPLIMIT:
   2009  1.121    dyoung 		case IPV6_2292HOPOPTS:
   2010  1.121    dyoung 		case IPV6_2292RTHDR:
   2011  1.121    dyoung 		case IPV6_2292DSTOPTS:
   2012  1.121    dyoung 			switch (optname) {
   2013   1.97    rpaulo 			case IPV6_2292PKTINFO:
   2014  1.121    dyoung 				optval = OPTBIT(IN6P_PKTINFO);
   2015  1.121    dyoung 				break;
   2016   1.97    rpaulo 			case IPV6_2292HOPLIMIT:
   2017  1.121    dyoung 				optval = OPTBIT(IN6P_HOPLIMIT);
   2018  1.121    dyoung 				break;
   2019   1.97    rpaulo 			case IPV6_2292HOPOPTS:
   2020  1.121    dyoung 				optval = OPTBIT(IN6P_HOPOPTS);
   2021  1.121    dyoung 				break;
   2022   1.97    rpaulo 			case IPV6_2292RTHDR:
   2023  1.121    dyoung 				optval = OPTBIT(IN6P_RTHDR);
   2024  1.121    dyoung 				break;
   2025   1.97    rpaulo 			case IPV6_2292DSTOPTS:
   2026  1.121    dyoung 				optval = OPTBIT(IN6P_DSTOPTS|IN6P_RTHDRDSTOPTS);
   2027    1.2    itojun 				break;
   2028  1.121    dyoung 			}
   2029  1.121    dyoung 			*mp = m = m_get(M_WAIT, MT_SOOPTS);
   2030  1.121    dyoung 			m->m_len = sizeof(int);
   2031  1.121    dyoung 			*mtod(m, int *) = optval;
   2032  1.121    dyoung 			break;
   2033  1.121    dyoung #endif
   2034  1.121    dyoung 		case IPV6_PKTINFO:
   2035  1.121    dyoung 		case IPV6_HOPOPTS:
   2036  1.121    dyoung 		case IPV6_RTHDR:
   2037  1.121    dyoung 		case IPV6_DSTOPTS:
   2038  1.121    dyoung 		case IPV6_RTHDRDSTOPTS:
   2039  1.121    dyoung 		case IPV6_NEXTHOP:
   2040  1.121    dyoung 		case IPV6_OTCLASS:
   2041  1.121    dyoung 		case IPV6_TCLASS:
   2042  1.121    dyoung 		case IPV6_DONTFRAG:
   2043  1.121    dyoung 		case IPV6_USE_MIN_MTU:
   2044  1.121    dyoung 			error = ip6_getpcbopt(in6p->in6p_outputopts,
   2045  1.121    dyoung 			    optname, mp);
   2046  1.121    dyoung 			break;
   2047  1.121    dyoung 
   2048  1.121    dyoung 		case IPV6_MULTICAST_IF:
   2049  1.121    dyoung 		case IPV6_MULTICAST_HOPS:
   2050  1.121    dyoung 		case IPV6_MULTICAST_LOOP:
   2051  1.121    dyoung 		case IPV6_JOIN_GROUP:
   2052  1.121    dyoung 		case IPV6_LEAVE_GROUP:
   2053  1.121    dyoung 			error = ip6_getmoptions(optname,
   2054  1.121    dyoung 			    in6p->in6p_moptions, mp);
   2055  1.121    dyoung 			break;
   2056    1.2    itojun 
   2057  1.114  degroote #if defined(IPSEC) || defined(FAST_IPSEC)
   2058  1.121    dyoung 		case IPV6_IPSEC_POLICY:
   2059  1.121    dyoung 		    {
   2060  1.121    dyoung 			void *req = NULL;
   2061  1.121    dyoung 			size_t len = 0;
   2062  1.121    dyoung 			if (m) {
   2063  1.121    dyoung 				req = mtod(m, void *);
   2064  1.121    dyoung 				len = m->m_len;
   2065  1.121    dyoung 			}
   2066  1.121    dyoung 			error = ipsec6_get_policy(in6p, req, len, mp);
   2067  1.121    dyoung 			break;
   2068  1.121    dyoung 		    }
   2069    1.2    itojun #endif /* IPSEC */
   2070    1.2    itojun 
   2071   1.97    rpaulo 
   2072   1.97    rpaulo 
   2073   1.97    rpaulo 
   2074  1.121    dyoung 		default:
   2075  1.121    dyoung 			error = ENOPROTOOPT;
   2076    1.2    itojun 			break;
   2077    1.2    itojun 		}
   2078  1.121    dyoung 		break;
   2079    1.2    itojun 	}
   2080   1.57    itojun 	return (error);
   2081   1.53    itojun }
   2082   1.53    itojun 
   2083   1.53    itojun int
   2084  1.119  christos ip6_raw_ctloutput(int op, struct socket *so, int level, int optname,
   2085  1.119  christos 	struct mbuf **mp)
   2086   1.53    itojun {
   2087   1.53    itojun 	int error = 0, optval, optlen;
   2088   1.53    itojun 	const int icmp6off = offsetof(struct icmp6_hdr, icmp6_cksum);
   2089   1.53    itojun 	struct in6pcb *in6p = sotoin6pcb(so);
   2090   1.53    itojun 	struct mbuf *m = *mp;
   2091   1.53    itojun 
   2092   1.53    itojun 	optlen = m ? m->m_len : 0;
   2093   1.53    itojun 
   2094   1.53    itojun 	if (level != IPPROTO_IPV6) {
   2095   1.53    itojun 		if (op == PRCO_SETOPT && *mp)
   2096   1.53    itojun 			(void)m_free(*mp);
   2097  1.121    dyoung 		return ENOPROTOOPT;
   2098   1.53    itojun 	}
   2099   1.55    itojun 
   2100   1.53    itojun 	switch (optname) {
   2101   1.53    itojun 	case IPV6_CHECKSUM:
   2102   1.53    itojun 		/*
   2103   1.53    itojun 		 * For ICMPv6 sockets, no modification allowed for checksum
   2104   1.53    itojun 		 * offset, permit "no change" values to help existing apps.
   2105   1.53    itojun 		 *
   2106   1.97    rpaulo 		 * XXX RFC3542 says: "An attempt to set IPV6_CHECKSUM
   2107   1.97    rpaulo 		 * for an ICMPv6 socket will fail."  The current
   2108   1.97    rpaulo 		 * behavior does not meet RFC3542.
   2109   1.53    itojun 		 */
   2110   1.53    itojun 		switch (op) {
   2111   1.53    itojun 		case PRCO_SETOPT:
   2112   1.53    itojun 			if (optlen != sizeof(int)) {
   2113   1.53    itojun 				error = EINVAL;
   2114   1.53    itojun 				break;
   2115   1.53    itojun 			}
   2116   1.53    itojun 			optval = *mtod(m, int *);
   2117   1.53    itojun 			if ((optval % 2) != 0) {
   2118   1.53    itojun 				/* the API assumes even offset values */
   2119   1.53    itojun 				error = EINVAL;
   2120   1.53    itojun 			} else if (so->so_proto->pr_protocol ==
   2121   1.53    itojun 			    IPPROTO_ICMPV6) {
   2122   1.53    itojun 				if (optval != icmp6off)
   2123   1.53    itojun 					error = EINVAL;
   2124   1.53    itojun 			} else
   2125   1.53    itojun 				in6p->in6p_cksum = optval;
   2126   1.53    itojun 			break;
   2127   1.53    itojun 
   2128   1.53    itojun 		case PRCO_GETOPT:
   2129   1.53    itojun 			if (so->so_proto->pr_protocol == IPPROTO_ICMPV6)
   2130   1.53    itojun 				optval = icmp6off;
   2131   1.53    itojun 			else
   2132   1.53    itojun 				optval = in6p->in6p_cksum;
   2133   1.53    itojun 
   2134   1.53    itojun 			*mp = m = m_get(M_WAIT, MT_SOOPTS);
   2135   1.53    itojun 			m->m_len = sizeof(int);
   2136   1.53    itojun 			*mtod(m, int *) = optval;
   2137   1.53    itojun 			break;
   2138   1.53    itojun 
   2139   1.53    itojun 		default:
   2140   1.53    itojun 			error = EINVAL;
   2141   1.53    itojun 			break;
   2142   1.53    itojun 		}
   2143   1.53    itojun 		break;
   2144   1.53    itojun 
   2145   1.53    itojun 	default:
   2146   1.53    itojun 		error = ENOPROTOOPT;
   2147   1.53    itojun 		break;
   2148   1.53    itojun 	}
   2149   1.53    itojun 
   2150   1.53    itojun 	if (op == PRCO_SETOPT && m)
   2151   1.53    itojun 		(void)m_free(m);
   2152   1.53    itojun 
   2153   1.57    itojun 	return (error);
   2154    1.2    itojun }
   2155    1.2    itojun 
#ifdef RFC2292
/*
 * Set up IP6 options in pcb for insertion in output packets or
 * specifying behavior of outgoing packets.
 *
 * Any option set already referenced by *pktopt is cleared and reused;
 * otherwise a new one is allocated.  *pktopt is reset to NULL up front
 * and only points at the option set again when the options in m were
 * accepted by ip6_setpktopts().  A missing or empty m simply discards
 * the previous options and returns 0.
 */
static int
ip6_pcbopts(struct ip6_pktopts **pktopt, struct mbuf *m, struct socket *so)
{
	struct ip6_pktopts *opt = *pktopt;
	struct lwp *l = curlwp;	/* XXX */
	int error;
	int priv;

	/* turn off any old options. */
	if (opt == NULL) {
		opt = malloc(sizeof(*opt), M_IP6OPT, M_WAITOK);
	} else {
#ifdef DIAGNOSTIC
		if (opt->ip6po_pktinfo || opt->ip6po_nexthop ||
		    opt->ip6po_hbh || opt->ip6po_dest1 || opt->ip6po_dest2 ||
		    opt->ip6po_rhinfo.ip6po_rhi_rthdr)
			printf("ip6_pcbopts: all specified options are cleared.\n");
#endif
		ip6_clearpktopts(opt, -1);
	}
	*pktopt = NULL;

	if (m == NULL || m->m_len == 0) {
		/*
		 * Only turning off any previous options, regardless of
		 * whether the opt is just created or given.
		 */
		free(opt, M_IP6OPT);
		return (0);
	}

	/* set options specified by user. */
	priv = (l != NULL &&
	    kauth_authorize_generic(l->l_cred, KAUTH_GENERIC_ISSUSER,
	    NULL) == 0);

	error = ip6_setpktopts(m, opt, NULL, priv, so->so_proto->pr_protocol);
	if (error != 0) {
		ip6_clearpktopts(opt, -1); /* XXX: discard all options */
		free(opt, M_IP6OPT);
		return (error);
	}

	*pktopt = opt;
	return (0);
}
#endif
   2205   1.97    rpaulo 
   2206   1.97    rpaulo /*
   2207   1.97    rpaulo  * initialize ip6_pktopts.  beware that there are non-zero default values in
   2208   1.97    rpaulo  * the struct.
   2209   1.97    rpaulo  */
   2210   1.97    rpaulo void
   2211   1.97    rpaulo ip6_initpktopts(struct ip6_pktopts *opt)
   2212   1.97    rpaulo {
   2213   1.97    rpaulo 
   2214   1.97    rpaulo 	memset(opt, 0, sizeof(*opt));
   2215   1.97    rpaulo 	opt->ip6po_hlim = -1;	/* -1 means default hop limit */
   2216   1.97    rpaulo 	opt->ip6po_tclass = -1;	/* -1 means default traffic class */
   2217   1.97    rpaulo 	opt->ip6po_minmtu = IP6PO_MINMTU_MCASTONLY;
   2218   1.97    rpaulo }
   2219   1.97    rpaulo 
   2220   1.97    rpaulo #define sin6tosa(sin6)	((struct sockaddr *)(sin6)) /* XXX */
   2221   1.97    rpaulo static int
   2222   1.97    rpaulo ip6_pcbopt(int optname, u_char *buf, int len, struct ip6_pktopts **pktopt,
   2223   1.97    rpaulo     int priv, int uproto)
   2224   1.97    rpaulo {
   2225   1.97    rpaulo 	struct ip6_pktopts *opt;
   2226   1.97    rpaulo 
   2227   1.97    rpaulo 	if (*pktopt == NULL) {
   2228   1.97    rpaulo 		*pktopt = malloc(sizeof(struct ip6_pktopts), M_IP6OPT,
   2229   1.97    rpaulo 		    M_WAITOK);
   2230   1.97    rpaulo 		ip6_initpktopts(*pktopt);
   2231   1.97    rpaulo 	}
   2232   1.97    rpaulo 	opt = *pktopt;
   2233   1.97    rpaulo 
   2234   1.97    rpaulo 	return (ip6_setpktopt(optname, buf, len, opt, priv, 1, 0, uproto));
   2235   1.97    rpaulo }
   2236   1.97    rpaulo 
   2237   1.97    rpaulo static int
   2238   1.97    rpaulo ip6_getpcbopt(struct ip6_pktopts *pktopt, int optname, struct mbuf **mp)
   2239   1.97    rpaulo {
   2240   1.97    rpaulo 	void *optdata = NULL;
   2241   1.97    rpaulo 	int optdatalen = 0;
   2242   1.97    rpaulo 	struct ip6_ext *ip6e;
   2243   1.97    rpaulo 	int error = 0;
   2244   1.97    rpaulo 	struct in6_pktinfo null_pktinfo;
   2245   1.97    rpaulo 	int deftclass = 0, on;
   2246   1.97    rpaulo 	int defminmtu = IP6PO_MINMTU_MCASTONLY;
   2247   1.97    rpaulo 	struct mbuf *m;
   2248   1.97    rpaulo 
   2249   1.97    rpaulo 	switch (optname) {
   2250   1.97    rpaulo 	case IPV6_PKTINFO:
   2251   1.97    rpaulo 		if (pktopt && pktopt->ip6po_pktinfo)
   2252   1.97    rpaulo 			optdata = (void *)pktopt->ip6po_pktinfo;
   2253   1.97    rpaulo 		else {
   2254   1.97    rpaulo 			/* XXX: we don't have to do this every time... */
   2255   1.97    rpaulo 			memset(&null_pktinfo, 0, sizeof(null_pktinfo));
   2256   1.97    rpaulo 			optdata = (void *)&null_pktinfo;
   2257   1.97    rpaulo 		}
   2258   1.97    rpaulo 		optdatalen = sizeof(struct in6_pktinfo);
   2259   1.97    rpaulo 		break;
   2260   1.97    rpaulo 	case IPV6_OTCLASS:
   2261   1.97    rpaulo 		/* XXX */
   2262   1.97    rpaulo 		return (EINVAL);
   2263   1.97    rpaulo 	case IPV6_TCLASS:
   2264   1.97    rpaulo 		if (pktopt && pktopt->ip6po_tclass >= 0)
   2265   1.97    rpaulo 			optdata = (void *)&pktopt->ip6po_tclass;
   2266   1.97    rpaulo 		else
   2267   1.97    rpaulo 			optdata = (void *)&deftclass;
   2268   1.97    rpaulo 		optdatalen = sizeof(int);
   2269   1.97    rpaulo 		break;
   2270   1.97    rpaulo 	case IPV6_HOPOPTS:
   2271   1.97    rpaulo 		if (pktopt && pktopt->ip6po_hbh) {
   2272   1.97    rpaulo 			optdata = (void *)pktopt->ip6po_hbh;
   2273   1.97    rpaulo 			ip6e = (struct ip6_ext *)pktopt->ip6po_hbh;
   2274   1.97    rpaulo 			optdatalen = (ip6e->ip6e_len + 1) << 3;
   2275   1.97    rpaulo 		}
   2276   1.97    rpaulo 		break;
   2277   1.97    rpaulo 	case IPV6_RTHDR:
   2278   1.97    rpaulo 		if (pktopt && pktopt->ip6po_rthdr) {
   2279   1.97    rpaulo 			optdata = (void *)pktopt->ip6po_rthdr;
   2280   1.97    rpaulo 			ip6e = (struct ip6_ext *)pktopt->ip6po_rthdr;
   2281   1.97    rpaulo 			optdatalen = (ip6e->ip6e_len + 1) << 3;
   2282   1.97    rpaulo 		}
   2283   1.97    rpaulo 		break;
   2284   1.97    rpaulo 	case IPV6_RTHDRDSTOPTS:
   2285   1.97    rpaulo 		if (pktopt && pktopt->ip6po_dest1) {
   2286   1.97    rpaulo 			optdata = (void *)pktopt->ip6po_dest1;
   2287   1.97    rpaulo 			ip6e = (struct ip6_ext *)pktopt->ip6po_dest1;
   2288   1.97    rpaulo 			optdatalen = (ip6e->ip6e_len + 1) << 3;
   2289   1.97    rpaulo 		}
   2290   1.97    rpaulo 		break;
   2291   1.97    rpaulo 	case IPV6_DSTOPTS:
   2292   1.97    rpaulo 		if (pktopt && pktopt->ip6po_dest2) {
   2293   1.97    rpaulo 			optdata = (void *)pktopt->ip6po_dest2;
   2294   1.97    rpaulo 			ip6e = (struct ip6_ext *)pktopt->ip6po_dest2;
   2295   1.97    rpaulo 			optdatalen = (ip6e->ip6e_len + 1) << 3;
   2296   1.97    rpaulo 		}
   2297   1.97    rpaulo 		break;
   2298   1.97    rpaulo 	case IPV6_NEXTHOP:
   2299   1.97    rpaulo 		if (pktopt && pktopt->ip6po_nexthop) {
   2300   1.97    rpaulo 			optdata = (void *)pktopt->ip6po_nexthop;
   2301   1.97    rpaulo 			optdatalen = pktopt->ip6po_nexthop->sa_len;
   2302   1.97    rpaulo 		}
   2303   1.97    rpaulo 		break;
   2304   1.97    rpaulo 	case IPV6_USE_MIN_MTU:
   2305   1.97    rpaulo 		if (pktopt)
   2306   1.97    rpaulo 			optdata = (void *)&pktopt->ip6po_minmtu;
   2307   1.97    rpaulo 		else
   2308   1.97    rpaulo 			optdata = (void *)&defminmtu;
   2309   1.97    rpaulo 		optdatalen = sizeof(int);
   2310   1.97    rpaulo 		break;
   2311   1.97    rpaulo 	case IPV6_DONTFRAG:
   2312   1.97    rpaulo 		if (pktopt && ((pktopt->ip6po_flags) & IP6PO_DONTFRAG))
   2313   1.97    rpaulo 			on = 1;
   2314   1.97    rpaulo 		else
   2315   1.97    rpaulo 			on = 0;
   2316   1.97    rpaulo 		optdata = (void *)&on;
   2317   1.97    rpaulo 		optdatalen = sizeof(on);
   2318   1.97    rpaulo 		break;
   2319   1.97    rpaulo 	default:		/* should not happen */
   2320   1.97    rpaulo #ifdef DIAGNOSTIC
   2321   1.97    rpaulo 		panic("ip6_getpcbopt: unexpected option\n");
   2322   1.97    rpaulo #endif
   2323   1.97    rpaulo 		return (ENOPROTOOPT);
   2324   1.97    rpaulo 	}
   2325   1.97    rpaulo 
   2326   1.97    rpaulo 	if (optdatalen > MCLBYTES)
   2327   1.97    rpaulo 		return (EMSGSIZE); /* XXX */
   2328   1.97    rpaulo 	*mp = m = m_get(M_WAIT, MT_SOOPTS);
   2329   1.97    rpaulo 	if (optdatalen > MLEN)
   2330   1.97    rpaulo 		MCLGET(m, M_WAIT);
   2331   1.97    rpaulo 	m->m_len = optdatalen;
   2332   1.97    rpaulo 	if (optdatalen)
   2333   1.97    rpaulo 		memcpy(mtod(m, void *), optdata, optdatalen);
   2334   1.97    rpaulo 
   2335   1.97    rpaulo 	return (error);
   2336   1.97    rpaulo }
   2337   1.97    rpaulo 
   2338   1.97    rpaulo void
   2339   1.97    rpaulo ip6_clearpktopts(struct ip6_pktopts *pktopt, int optname)
   2340   1.97    rpaulo {
   2341   1.97    rpaulo 	if (optname == -1 || optname == IPV6_PKTINFO) {
   2342   1.97    rpaulo 		if (pktopt->ip6po_pktinfo)
   2343   1.97    rpaulo 			free(pktopt->ip6po_pktinfo, M_IP6OPT);
   2344   1.97    rpaulo 		pktopt->ip6po_pktinfo = NULL;
   2345   1.97    rpaulo 	}
   2346   1.97    rpaulo 	if (optname == -1 || optname == IPV6_HOPLIMIT)
   2347   1.97    rpaulo 		pktopt->ip6po_hlim = -1;
   2348   1.97    rpaulo 	if (optname == -1 || optname == IPV6_TCLASS)
   2349   1.97    rpaulo 		pktopt->ip6po_tclass = -1;
   2350   1.97    rpaulo 	if (optname == -1 || optname == IPV6_NEXTHOP) {
   2351  1.118    dyoung 		rtcache_free(&pktopt->ip6po_nextroute);
   2352   1.97    rpaulo 		if (pktopt->ip6po_nexthop)
   2353   1.97    rpaulo 			free(pktopt->ip6po_nexthop, M_IP6OPT);
   2354   1.97    rpaulo 		pktopt->ip6po_nexthop = NULL;
   2355   1.97    rpaulo 	}
   2356   1.97    rpaulo 	if (optname == -1 || optname == IPV6_HOPOPTS) {
   2357   1.97    rpaulo 		if (pktopt->ip6po_hbh)
   2358   1.97    rpaulo 			free(pktopt->ip6po_hbh, M_IP6OPT);
   2359   1.97    rpaulo 		pktopt->ip6po_hbh = NULL;
   2360   1.97    rpaulo 	}
   2361   1.97    rpaulo 	if (optname == -1 || optname == IPV6_RTHDRDSTOPTS) {
   2362   1.97    rpaulo 		if (pktopt->ip6po_dest1)
   2363   1.97    rpaulo 			free(pktopt->ip6po_dest1, M_IP6OPT);
   2364   1.97    rpaulo 		pktopt->ip6po_dest1 = NULL;
   2365   1.97    rpaulo 	}
   2366   1.97    rpaulo 	if (optname == -1 || optname == IPV6_RTHDR) {
   2367   1.97    rpaulo 		if (pktopt->ip6po_rhinfo.ip6po_rhi_rthdr)
   2368   1.97    rpaulo 			free(pktopt->ip6po_rhinfo.ip6po_rhi_rthdr, M_IP6OPT);
   2369   1.97    rpaulo 		pktopt->ip6po_rhinfo.ip6po_rhi_rthdr = NULL;
   2370  1.118    dyoung 		rtcache_free(&pktopt->ip6po_route);
   2371   1.97    rpaulo 	}
   2372   1.97    rpaulo 	if (optname == -1 || optname == IPV6_DSTOPTS) {
   2373   1.97    rpaulo 		if (pktopt->ip6po_dest2)
   2374   1.97    rpaulo 			free(pktopt->ip6po_dest2, M_IP6OPT);
   2375   1.97    rpaulo 		pktopt->ip6po_dest2 = NULL;
   2376   1.97    rpaulo 	}
   2377   1.97    rpaulo }
   2378   1.97    rpaulo 
   2379   1.97    rpaulo #define PKTOPT_EXTHDRCPY(type) 					\
   2380   1.97    rpaulo do {								\
   2381   1.97    rpaulo 	if (src->type) {					\
   2382   1.97    rpaulo 		int hlen = (((struct ip6_ext *)src->type)->ip6e_len + 1) << 3;\
   2383   1.97    rpaulo 		dst->type = malloc(hlen, M_IP6OPT, canwait);	\
   2384   1.97    rpaulo 		if (dst->type == NULL && canwait == M_NOWAIT)	\
   2385   1.97    rpaulo 			goto bad;				\
   2386   1.97    rpaulo 		memcpy(dst->type, src->type, hlen);		\
   2387   1.97    rpaulo 	}							\
   2388   1.97    rpaulo } while (/*CONSTCOND*/ 0)
   2389   1.97    rpaulo 
   2390   1.97    rpaulo static int
   2391   1.97    rpaulo copypktopts(struct ip6_pktopts *dst, struct ip6_pktopts *src, int canwait)
   2392   1.97    rpaulo {
   2393   1.97    rpaulo 	dst->ip6po_hlim = src->ip6po_hlim;
   2394   1.97    rpaulo 	dst->ip6po_tclass = src->ip6po_tclass;
   2395   1.97    rpaulo 	dst->ip6po_flags = src->ip6po_flags;
   2396   1.97    rpaulo 	if (src->ip6po_pktinfo) {
   2397   1.97    rpaulo 		dst->ip6po_pktinfo = malloc(sizeof(*dst->ip6po_pktinfo),
   2398   1.97    rpaulo 		    M_IP6OPT, canwait);
   2399   1.97    rpaulo 		if (dst->ip6po_pktinfo == NULL && canwait == M_NOWAIT)
   2400   1.97    rpaulo 			goto bad;
   2401   1.97    rpaulo 		*dst->ip6po_pktinfo = *src->ip6po_pktinfo;
   2402   1.97    rpaulo 	}
   2403   1.97    rpaulo 	if (src->ip6po_nexthop) {
   2404   1.97    rpaulo 		dst->ip6po_nexthop = malloc(src->ip6po_nexthop->sa_len,
   2405   1.97    rpaulo 		    M_IP6OPT, canwait);
   2406   1.97    rpaulo 		if (dst->ip6po_nexthop == NULL && canwait == M_NOWAIT)
   2407   1.97    rpaulo 			goto bad;
   2408   1.97    rpaulo 		memcpy(dst->ip6po_nexthop, src->ip6po_nexthop,
   2409   1.97    rpaulo 		    src->ip6po_nexthop->sa_len);
   2410   1.97    rpaulo 	}
   2411   1.97    rpaulo 	PKTOPT_EXTHDRCPY(ip6po_hbh);
   2412   1.97    rpaulo 	PKTOPT_EXTHDRCPY(ip6po_dest1);
   2413   1.97    rpaulo 	PKTOPT_EXTHDRCPY(ip6po_dest2);
   2414   1.97    rpaulo 	PKTOPT_EXTHDRCPY(ip6po_rthdr); /* not copy the cached route */
   2415   1.97    rpaulo 	return (0);
   2416   1.97    rpaulo 
   2417   1.97    rpaulo   bad:
   2418   1.97    rpaulo 	if (dst->ip6po_pktinfo) free(dst->ip6po_pktinfo, M_IP6OPT);
   2419   1.97    rpaulo 	if (dst->ip6po_nexthop) free(dst->ip6po_nexthop, M_IP6OPT);
   2420   1.97    rpaulo 	if (dst->ip6po_hbh) free(dst->ip6po_hbh, M_IP6OPT);
   2421   1.97    rpaulo 	if (dst->ip6po_dest1) free(dst->ip6po_dest1, M_IP6OPT);
   2422   1.97    rpaulo 	if (dst->ip6po_dest2) free(dst->ip6po_dest2, M_IP6OPT);
   2423   1.97    rpaulo 	if (dst->ip6po_rthdr) free(dst->ip6po_rthdr, M_IP6OPT);
   2424   1.97    rpaulo 
   2425   1.97    rpaulo 	return (ENOBUFS);
   2426   1.97    rpaulo }
   2427   1.97    rpaulo #undef PKTOPT_EXTHDRCPY
   2428   1.97    rpaulo 
   2429   1.97    rpaulo struct ip6_pktopts *
   2430   1.97    rpaulo ip6_copypktopts(struct ip6_pktopts *src, int canwait)
   2431   1.97    rpaulo {
   2432   1.97    rpaulo 	int error;
   2433   1.97    rpaulo 	struct ip6_pktopts *dst;
   2434   1.97    rpaulo 
   2435   1.97    rpaulo 	dst = malloc(sizeof(*dst), M_IP6OPT, canwait);
   2436   1.97    rpaulo 	if (dst == NULL && canwait == M_NOWAIT)
   2437   1.97    rpaulo 		return (NULL);
   2438   1.97    rpaulo 	ip6_initpktopts(dst);
   2439   1.97    rpaulo 
   2440   1.97    rpaulo 	if ((error = copypktopts(dst, src, canwait)) != 0) {
   2441   1.97    rpaulo 		free(dst, M_IP6OPT);
   2442   1.97    rpaulo 		return (NULL);
   2443   1.97    rpaulo 	}
   2444   1.97    rpaulo 
   2445   1.97    rpaulo 	return (dst);
   2446   1.97    rpaulo }
   2447   1.97    rpaulo 
   2448   1.97    rpaulo void
   2449   1.97    rpaulo ip6_freepcbopts(struct ip6_pktopts *pktopt)
   2450   1.97    rpaulo {
   2451   1.97    rpaulo 	if (pktopt == NULL)
   2452   1.97    rpaulo 		return;
   2453   1.97    rpaulo 
   2454   1.97    rpaulo 	ip6_clearpktopts(pktopt, -1);
   2455   1.97    rpaulo 
   2456   1.97    rpaulo 	free(pktopt, M_IP6OPT);
   2457   1.97    rpaulo }
   2458    1.2    itojun 
   2459    1.2    itojun /*
   2460    1.2    itojun  * Set the IP6 multicast options in response to user setsockopt().
   2461    1.2    itojun  */
   2462    1.2    itojun static int
   2463  1.119  christos ip6_setmoptions(int optname, struct ip6_moptions **im6op, struct mbuf *m)
   2464    1.2    itojun {
   2465    1.2    itojun 	int error = 0;
   2466    1.2    itojun 	u_int loop, ifindex;
   2467    1.2    itojun 	struct ipv6_mreq *mreq;
   2468    1.2    itojun 	struct ifnet *ifp;
   2469    1.2    itojun 	struct ip6_moptions *im6o = *im6op;
   2470  1.118    dyoung 	struct route ro;
   2471    1.2    itojun 	struct in6_multi_mship *imm;
   2472  1.101        ad 	struct lwp *l = curlwp;	/* XXX */
   2473    1.2    itojun 
   2474    1.2    itojun 	if (im6o == NULL) {
   2475    1.2    itojun 		/*
   2476    1.2    itojun 		 * No multicast option buffer attached to the pcb;
   2477    1.2    itojun 		 * allocate one and initialize to default values.
   2478    1.2    itojun 		 */
   2479    1.2    itojun 		im6o = (struct ip6_moptions *)
   2480    1.2    itojun 			malloc(sizeof(*im6o), M_IPMOPTS, M_WAITOK);
   2481    1.2    itojun 
   2482    1.2    itojun 		if (im6o == NULL)
   2483   1.57    itojun 			return (ENOBUFS);
   2484    1.2    itojun 		*im6op = im6o;
   2485    1.2    itojun 		im6o->im6o_multicast_ifp = NULL;
   2486    1.2    itojun 		im6o->im6o_multicast_hlim = ip6_defmcasthlim;
   2487    1.2    itojun 		im6o->im6o_multicast_loop = IPV6_DEFAULT_MULTICAST_LOOP;
   2488    1.2    itojun 		LIST_INIT(&im6o->im6o_memberships);
   2489    1.2    itojun 	}
   2490    1.2    itojun 
   2491    1.2    itojun 	switch (optname) {
   2492    1.2    itojun 
   2493    1.2    itojun 	case IPV6_MULTICAST_IF:
   2494    1.2    itojun 		/*
   2495    1.2    itojun 		 * Select the interface for outgoing multicast packets.
   2496    1.2    itojun 		 */
   2497    1.2    itojun 		if (m == NULL || m->m_len != sizeof(u_int)) {
   2498    1.2    itojun 			error = EINVAL;
   2499    1.2    itojun 			break;
   2500    1.2    itojun 		}
   2501   1.25    itojun 		bcopy(mtod(m, u_int *), &ifindex, sizeof(ifindex));
   2502   1.87  drochner 		if (ifindex != 0) {
   2503  1.102  christos 			if (if_indexlim <= ifindex || !ifindex2ifnet[ifindex]) {
   2504   1.87  drochner 				error = ENXIO;	/* XXX EINVAL? */
   2505   1.87  drochner 				break;
   2506   1.87  drochner 			}
   2507   1.87  drochner 			ifp = ifindex2ifnet[ifindex];
   2508   1.87  drochner 			if ((ifp->if_flags & IFF_MULTICAST) == 0) {
   2509   1.87  drochner 				error = EADDRNOTAVAIL;
   2510   1.87  drochner 				break;
   2511   1.87  drochner 			}
   2512   1.87  drochner 		} else
   2513   1.87  drochner 			ifp = NULL;
   2514    1.2    itojun 		im6o->im6o_multicast_ifp = ifp;
   2515    1.2    itojun 		break;
   2516    1.2    itojun 
   2517    1.2    itojun 	case IPV6_MULTICAST_HOPS:
   2518    1.2    itojun 	    {
   2519    1.2    itojun 		/*
   2520    1.2    itojun 		 * Set the IP6 hoplimit for outgoing multicast packets.
   2521    1.2    itojun 		 */
   2522    1.2    itojun 		int optval;
   2523    1.2    itojun 		if (m == NULL || m->m_len != sizeof(int)) {
   2524    1.2    itojun 			error = EINVAL;
   2525    1.2    itojun 			break;
   2526    1.2    itojun 		}
   2527   1.25    itojun 		bcopy(mtod(m, u_int *), &optval, sizeof(optval));
   2528    1.2    itojun 		if (optval < -1 || optval >= 256)
   2529    1.2    itojun 			error = EINVAL;
   2530    1.2    itojun 		else if (optval == -1)
   2531    1.2    itojun 			im6o->im6o_multicast_hlim = ip6_defmcasthlim;
   2532    1.2    itojun 		else
   2533    1.2    itojun 			im6o->im6o_multicast_hlim = optval;
   2534    1.2    itojun 		break;
   2535    1.2    itojun 	    }
   2536    1.2    itojun 
   2537    1.2    itojun 	case IPV6_MULTICAST_LOOP:
   2538    1.2    itojun 		/*
   2539    1.2    itojun 		 * Set the loopback flag for outgoing multicast packets.
   2540    1.2    itojun 		 * Must be zero or one.
   2541    1.2    itojun 		 */
   2542   1.25    itojun 		if (m == NULL || m->m_len != sizeof(u_int)) {
   2543   1.25    itojun 			error = EINVAL;
   2544   1.25    itojun 			break;
   2545   1.25    itojun 		}
   2546   1.25    itojun 		bcopy(mtod(m, u_int *), &loop, sizeof(loop));
   2547   1.25    itojun 		if (loop > 1) {
   2548    1.2    itojun 			error = EINVAL;
   2549    1.2    itojun 			break;
   2550    1.2    itojun 		}
   2551    1.2    itojun 		im6o->im6o_multicast_loop = loop;
   2552    1.2    itojun 		break;
   2553    1.2    itojun 
   2554    1.2    itojun 	case IPV6_JOIN_GROUP:
   2555    1.2    itojun 		/*
   2556    1.2    itojun 		 * Add a multicast group membership.
   2557    1.2    itojun 		 * Group must be a valid IP6 multicast address.
   2558    1.2    itojun 		 */
   2559    1.2    itojun 		if (m == NULL || m->m_len != sizeof(struct ipv6_mreq)) {
   2560    1.2    itojun 			error = EINVAL;
   2561    1.2    itojun 			break;
   2562    1.2    itojun 		}
   2563    1.2    itojun 		mreq = mtod(m, struct ipv6_mreq *);
   2564    1.9    itojun 		if (IN6_IS_ADDR_UNSPECIFIED(&mreq->ipv6mr_multiaddr)) {
   2565    1.2    itojun 			/*
   2566    1.2    itojun 			 * We use the unspecified address to specify to accept
   2567    1.2    itojun 			 * all multicast addresses. Only super user is allowed
   2568    1.2    itojun 			 * to do this.
   2569    1.2    itojun 			 */
   2570  1.101        ad 			if (kauth_authorize_generic(l->l_cred,
   2571  1.111      elad 			    KAUTH_GENERIC_ISSUSER, NULL))
   2572   1.31    itojun 			{
   2573    1.2    itojun 				error = EACCES;
   2574    1.2    itojun 				break;
   2575    1.2    itojun 			}
   2576    1.2    itojun 		} else if (!IN6_IS_ADDR_MULTICAST(&mreq->ipv6mr_multiaddr)) {
   2577    1.2    itojun 			error = EINVAL;
   2578    1.2    itojun 			break;
   2579    1.2    itojun 		}
   2580    1.2    itojun 
   2581    1.2    itojun 		/*
   2582    1.2    itojun 		 * If no interface was explicitly specified, choose an
   2583    1.2    itojun 		 * appropriate one according to the given multicast address.
   2584    1.2    itojun 		 */
   2585   1.94    rpaulo 		if (mreq->ipv6mr_interface == 0) {
   2586  1.124    dyoung 			struct rtentry *rt;
   2587  1.118    dyoung 			union {
   2588  1.118    dyoung 				struct sockaddr		dst;
   2589  1.118    dyoung 				struct sockaddr_in6	dst6;
   2590  1.118    dyoung 			} u;
   2591   1.94    rpaulo 
   2592   1.94    rpaulo 			/*
   2593   1.94    rpaulo 			 * Look up the routing table for the
   2594   1.94    rpaulo 			 * address, and choose the outgoing interface.
   2595   1.94    rpaulo 			 *   XXX: is it a good approach?
   2596   1.94    rpaulo 			 */
   2597  1.113    dyoung 			memset(&ro, 0, sizeof(ro));
   2598  1.118    dyoung 			sockaddr_in6_init(&u.dst6, &mreq->ipv6mr_multiaddr, 0,
   2599  1.118    dyoung 			    0, 0);
   2600  1.118    dyoung 			rtcache_setdst(&ro, &u.dst);
   2601  1.118    dyoung 			rtcache_init(&ro);
   2602  1.124    dyoung 			ifp = (rt = rtcache_getrt(&ro)) != NULL ? rt->rt_ifp
   2603  1.124    dyoung 			                                        : NULL;
   2604  1.118    dyoung 			rtcache_free(&ro);
   2605   1.94    rpaulo 		} else {
   2606   1.94    rpaulo 			/*
   2607   1.94    rpaulo 			 * If the interface is specified, validate it.
   2608   1.94    rpaulo 			 */
   2609  1.102  christos 			if (if_indexlim <= mreq->ipv6mr_interface ||
   2610   1.87  drochner 			    !ifindex2ifnet[mreq->ipv6mr_interface]) {
   2611   1.87  drochner 				error = ENXIO;	/* XXX EINVAL? */
   2612   1.87  drochner 				break;
   2613   1.87  drochner 			}
   2614   1.87  drochner 			ifp = ifindex2ifnet[mreq->ipv6mr_interface];
   2615   1.87  drochner 		}
   2616    1.2    itojun 
   2617    1.2    itojun 		/*
   2618    1.2    itojun 		 * See if we found an interface, and confirm that it
   2619    1.2    itojun 		 * supports multicast
   2620    1.2    itojun 		 */
   2621    1.2    itojun 		if (ifp == NULL || (ifp->if_flags & IFF_MULTICAST) == 0) {
   2622    1.2    itojun 			error = EADDRNOTAVAIL;
   2623    1.2    itojun 			break;
   2624    1.2    itojun 		}
   2625   1.94    rpaulo 
   2626   1.94    rpaulo 		if (in6_setscope(&mreq->ipv6mr_multiaddr, ifp, NULL)) {
   2627   1.94    rpaulo 			error = EADDRNOTAVAIL; /* XXX: should not happen */
   2628   1.94    rpaulo 			break;
   2629    1.2    itojun 		}
   2630   1.94    rpaulo 
   2631    1.2    itojun 		/*
   2632    1.2    itojun 		 * See if the membership already exists.
   2633    1.2    itojun 		 */
   2634    1.2    itojun 		for (imm = im6o->im6o_memberships.lh_first;
   2635    1.2    itojun 		     imm != NULL; imm = imm->i6mm_chain.le_next)
   2636    1.2    itojun 			if (imm->i6mm_maddr->in6m_ifp == ifp &&
   2637    1.2    itojun 			    IN6_ARE_ADDR_EQUAL(&imm->i6mm_maddr->in6m_addr,
   2638   1.49    itojun 			    &mreq->ipv6mr_multiaddr))
   2639    1.2    itojun 				break;
   2640    1.2    itojun 		if (imm != NULL) {
   2641    1.2    itojun 			error = EADDRINUSE;
   2642    1.2    itojun 			break;
   2643    1.2    itojun 		}
   2644    1.2    itojun 		/*
   2645    1.2    itojun 		 * Everything looks good; add a new record to the multicast
   2646    1.2    itojun 		 * address list for the given interface.
   2647    1.2    itojun 		 */
   2648   1.95    rpaulo 		imm = in6_joingroup(ifp, &mreq->ipv6mr_multiaddr, &error, 0);
   2649   1.95    rpaulo 		if (imm == NULL)
   2650    1.2    itojun 			break;
   2651    1.2    itojun 		LIST_INSERT_HEAD(&im6o->im6o_memberships, imm, i6mm_chain);
   2652    1.2    itojun 		break;
   2653    1.2    itojun 
   2654    1.2    itojun 	case IPV6_LEAVE_GROUP:
   2655    1.2    itojun 		/*
   2656    1.2    itojun 		 * Drop a multicast group membership.
   2657    1.2    itojun 		 * Group must be a valid IP6 multicast address.
   2658    1.2    itojun 		 */
   2659    1.2    itojun 		if (m == NULL || m->m_len != sizeof(struct ipv6_mreq)) {
   2660    1.2    itojun 			error = EINVAL;
   2661    1.2    itojun 			break;
   2662    1.2    itojun 		}
   2663    1.2    itojun 		mreq = mtod(m, struct ipv6_mreq *);
   2664   1.94    rpaulo 
   2665    1.2    itojun 		/*
   2666    1.2    itojun 		 * If an interface address was specified, get a pointer
   2667    1.2    itojun 		 * to its ifnet structure.
   2668    1.2    itojun 		 */
   2669   1.87  drochner 		if (mreq->ipv6mr_interface != 0) {
   2670  1.102  christos 			if (if_indexlim <= mreq->ipv6mr_interface ||
   2671   1.87  drochner 			    !ifindex2ifnet[mreq->ipv6mr_interface]) {
   2672   1.87  drochner 				error = ENXIO;	/* XXX EINVAL? */
   2673   1.87  drochner 				break;
   2674   1.87  drochner 			}
   2675   1.87  drochner 			ifp = ifindex2ifnet[mreq->ipv6mr_interface];
   2676   1.87  drochner 		} else
   2677   1.87  drochner 			ifp = NULL;
   2678   1.94    rpaulo 
   2679   1.94    rpaulo 		/* Fill in the scope zone ID */
   2680   1.94    rpaulo 		if (ifp) {
   2681   1.94    rpaulo 			if (in6_setscope(&mreq->ipv6mr_multiaddr, ifp, NULL)) {
   2682   1.94    rpaulo 				/* XXX: should not happen */
   2683   1.94    rpaulo 				error = EADDRNOTAVAIL;
   2684   1.94    rpaulo 				break;
   2685   1.94    rpaulo 			}
   2686   1.94    rpaulo 		} else if (mreq->ipv6mr_interface != 0) {
   2687   1.94    rpaulo 			/*
   2688   1.94    rpaulo 			 * XXX: This case would happen when the (positive)
   2689   1.94    rpaulo 			 * index is in the valid range, but the corresponding
   2690   1.94    rpaulo 			 * interface has been detached dynamically.  The above
   2691   1.94    rpaulo 			 * check probably prevents such a case from happening
   2692   1.94    rpaulo 			 * here, but we check it explicitly for safety.
   2693   1.94    rpaulo 			 */
   2694   1.94    rpaulo 			error = EADDRNOTAVAIL;
   2695   1.94    rpaulo 			break;
   2696   1.94    rpaulo 		} else {	/* ipv6mr_interface == 0 */
   2697   1.94    rpaulo 			struct sockaddr_in6 sa6_mc;
   2698   1.94    rpaulo 
   2699   1.94    rpaulo 			/*
   2700   1.94    rpaulo 			 * The API spec says as follows:
   2701   1.94    rpaulo 			 *  If the interface index is specified as 0, the
   2702   1.94    rpaulo 			 *  system may choose a multicast group membership to
   2703   1.94    rpaulo 			 *  drop by matching the multicast address only.
   2704   1.94    rpaulo 			 * On the other hand, we cannot disambiguate the scope
   2705   1.94    rpaulo 			 * zone unless an interface is provided.  Thus, we
   2706   1.94    rpaulo 			 * check if there's ambiguity with the default scope
   2707   1.94    rpaulo 			 * zone as the last resort.
   2708   1.94    rpaulo 			 */
   2709  1.123    dyoung 			sockaddr_in6_init(&sa6_mc, &mreq->ipv6mr_multiaddr,
   2710  1.123    dyoung 			    0, 0, 0);
   2711   1.94    rpaulo 			error = sa6_embedscope(&sa6_mc, ip6_use_defzone);
   2712   1.94    rpaulo 			if (error != 0)
   2713   1.94    rpaulo 				break;
   2714   1.94    rpaulo 			mreq->ipv6mr_multiaddr = sa6_mc.sin6_addr;
   2715    1.2    itojun 		}
   2716   1.94    rpaulo 
   2717    1.2    itojun 		/*
   2718    1.2    itojun 		 * Find the membership in the membership list.
   2719    1.2    itojun 		 */
   2720    1.2    itojun 		for (imm = im6o->im6o_memberships.lh_first;
   2721    1.2    itojun 		     imm != NULL; imm = imm->i6mm_chain.le_next) {
   2722   1.49    itojun 			if ((ifp == NULL || imm->i6mm_maddr->in6m_ifp == ifp) &&
   2723    1.2    itojun 			    IN6_ARE_ADDR_EQUAL(&imm->i6mm_maddr->in6m_addr,
   2724   1.49    itojun 			    &mreq->ipv6mr_multiaddr))
   2725    1.2    itojun 				break;
   2726    1.2    itojun 		}
   2727    1.2    itojun 		if (imm == NULL) {
   2728    1.2    itojun 			/* Unable to resolve interface */
   2729    1.2    itojun 			error = EADDRNOTAVAIL;
   2730    1.2    itojun 			break;
   2731    1.2    itojun 		}
   2732    1.2    itojun 		/*
   2733    1.2    itojun 		 * Give up the multicast address record to which the
   2734    1.2    itojun 		 * membership points.
   2735    1.2    itojun 		 */
   2736    1.2    itojun 		LIST_REMOVE(imm, i6mm_chain);
   2737   1.43    itojun 		in6_leavegroup(imm);
   2738    1.2    itojun 		break;
   2739    1.2    itojun 
   2740    1.2    itojun 	default:
   2741    1.2    itojun 		error = EOPNOTSUPP;
   2742    1.2    itojun 		break;
   2743    1.2    itojun 	}
   2744    1.2    itojun 
   2745    1.2    itojun 	/*
   2746    1.2    itojun 	 * If all options have default values, no need to keep the mbuf.
   2747    1.2    itojun 	 */
   2748    1.2    itojun 	if (im6o->im6o_multicast_ifp == NULL &&
   2749    1.2    itojun 	    im6o->im6o_multicast_hlim == ip6_defmcasthlim &&
   2750    1.2    itojun 	    im6o->im6o_multicast_loop == IPV6_DEFAULT_MULTICAST_LOOP &&
   2751    1.2    itojun 	    im6o->im6o_memberships.lh_first == NULL) {
   2752    1.2    itojun 		free(*im6op, M_IPMOPTS);
   2753    1.2    itojun 		*im6op = NULL;
   2754    1.2    itojun 	}
   2755    1.2    itojun 
   2756   1.57    itojun 	return (error);
   2757    1.2    itojun }
   2758    1.2    itojun 
   2759    1.2    itojun /*
   2760    1.2    itojun  * Return the IP6 multicast options in response to user getsockopt().
   2761    1.2    itojun  */
   2762    1.2    itojun static int
   2763  1.119  christos ip6_getmoptions(int optname, struct ip6_moptions *im6o, struct mbuf **mp)
   2764    1.2    itojun {
   2765    1.2    itojun 	u_int *hlim, *loop, *ifindex;
   2766    1.2    itojun 
   2767    1.2    itojun 	*mp = m_get(M_WAIT, MT_SOOPTS);
   2768    1.2    itojun 
   2769    1.2    itojun 	switch (optname) {
   2770    1.2    itojun 
   2771    1.2    itojun 	case IPV6_MULTICAST_IF:
   2772    1.2    itojun 		ifindex = mtod(*mp, u_int *);
   2773    1.2    itojun 		(*mp)->m_len = sizeof(u_int);
   2774    1.2    itojun 		if (im6o == NULL || im6o->im6o_multicast_ifp == NULL)
   2775    1.2    itojun 			*ifindex = 0;
   2776    1.2    itojun 		else
   2777    1.2    itojun 			*ifindex = im6o->im6o_multicast_ifp->if_index;
   2778   1.57    itojun 		return (0);
   2779    1.2    itojun 
   2780    1.2    itojun 	case IPV6_MULTICAST_HOPS:
   2781    1.2    itojun 		hlim = mtod(*mp, u_int *);
   2782    1.2    itojun 		(*mp)->m_len = sizeof(u_int);
   2783    1.2    itojun 		if (im6o == NULL)
   2784    1.2    itojun 			*hlim = ip6_defmcasthlim;
   2785    1.2    itojun 		else
   2786    1.2    itojun 			*hlim = im6o->im6o_multicast_hlim;
   2787   1.57    itojun 		return (0);
   2788    1.2    itojun 
   2789    1.2    itojun 	case IPV6_MULTICAST_LOOP:
   2790    1.2    itojun 		loop = mtod(*mp, u_int *);
   2791    1.2    itojun 		(*mp)->m_len = sizeof(u_int);
   2792    1.2    itojun 		if (im6o == NULL)
   2793    1.2    itojun 			*loop = ip6_defmcasthlim;
   2794    1.2    itojun 		else
   2795    1.2    itojun 			*loop = im6o->im6o_multicast_loop;
   2796   1.57    itojun 		return (0);
   2797    1.2    itojun 
   2798    1.2    itojun 	default:
   2799   1.57    itojun 		return (EOPNOTSUPP);
   2800    1.2    itojun 	}
   2801    1.2    itojun }
   2802    1.2    itojun 
   2803    1.2    itojun /*
   2804    1.2    itojun  * Discard the IP6 multicast options.
   2805    1.2    itojun  */
   2806    1.2    itojun void
   2807  1.119  christos ip6_freemoptions(struct ip6_moptions *im6o)
   2808    1.2    itojun {
   2809    1.2    itojun 	struct in6_multi_mship *imm;
   2810    1.2    itojun 
   2811    1.2    itojun 	if (im6o == NULL)
   2812    1.2    itojun 		return;
   2813    1.2    itojun 
   2814    1.2    itojun 	while ((imm = im6o->im6o_memberships.lh_first) != NULL) {
   2815    1.2    itojun 		LIST_REMOVE(imm, i6mm_chain);
   2816   1.43    itojun 		in6_leavegroup(imm);
   2817    1.2    itojun 	}
   2818    1.2    itojun 	free(im6o, M_IPMOPTS);
   2819    1.2    itojun }
   2820    1.2    itojun 
   2821    1.2    itojun /*
   2822    1.2    itojun  * Set IPv6 outgoing packet options based on advanced API.
   2823    1.2    itojun  */
   2824    1.2    itojun int
   2825  1.119  christos ip6_setpktopts(struct mbuf *control, struct ip6_pktopts *opt,
   2826  1.119  christos 	struct ip6_pktopts *stickyopt, int priv, int uproto)
   2827    1.2    itojun {
   2828   1.31    itojun 	struct cmsghdr *cm = 0;
   2829    1.2    itojun 
   2830   1.97    rpaulo 	if (control == NULL || opt == NULL)
   2831   1.57    itojun 		return (EINVAL);
   2832    1.2    itojun 
   2833   1.97    rpaulo 	ip6_initpktopts(opt);
   2834   1.97    rpaulo 	if (stickyopt) {
   2835   1.97    rpaulo 		int error;
   2836   1.97    rpaulo 
   2837   1.97    rpaulo 		/*
   2838   1.97    rpaulo 		 * If stickyopt is provided, make a local copy of the options
   2839   1.97    rpaulo 		 * for this particular packet, then override them by ancillary
   2840   1.97    rpaulo 		 * objects.
   2841   1.97    rpaulo 		 * XXX: copypktopts() does not copy the cached route to a next
   2842   1.97    rpaulo 		 * hop (if any).  This is not very good in terms of efficiency,
   2843   1.97    rpaulo 		 * but we can allow this since this option should be rarely
   2844   1.97    rpaulo 		 * used.
   2845   1.97    rpaulo 		 */
   2846   1.97    rpaulo 		if ((error = copypktopts(opt, stickyopt, M_NOWAIT)) != 0)
   2847   1.97    rpaulo 			return (error);
   2848   1.97    rpaulo 	}
   2849    1.2    itojun 
   2850    1.2    itojun 	/*
   2851    1.2    itojun 	 * XXX: Currently, we assume all the optional information is stored
   2852    1.2    itojun 	 * in a single mbuf.
   2853    1.2    itojun 	 */
   2854    1.2    itojun 	if (control->m_next)
   2855   1.57    itojun 		return (EINVAL);
   2856    1.2    itojun 
   2857    1.2    itojun 	for (; control->m_len; control->m_data += CMSG_ALIGN(cm->cmsg_len),
   2858   1.49    itojun 	    control->m_len -= CMSG_ALIGN(cm->cmsg_len)) {
   2859   1.97    rpaulo 		int error;
   2860   1.97    rpaulo 
   2861   1.97    rpaulo 		if (control->m_len < CMSG_LEN(0))
   2862   1.97    rpaulo 			return (EINVAL);
   2863   1.97    rpaulo 
   2864    1.2    itojun 		cm = mtod(control, struct cmsghdr *);
   2865    1.2    itojun 		if (cm->cmsg_len == 0 || cm->cmsg_len > control->m_len)
   2866   1.57    itojun 			return (EINVAL);
   2867    1.2    itojun 		if (cm->cmsg_level != IPPROTO_IPV6)
   2868    1.2    itojun 			continue;
   2869    1.2    itojun 
   2870   1.97    rpaulo 		error = ip6_setpktopt(cm->cmsg_type, CMSG_DATA(cm),
   2871   1.97    rpaulo 		    cm->cmsg_len - CMSG_LEN(0), opt, priv, 0, 1, uproto);
   2872   1.97    rpaulo 		if (error)
   2873   1.97    rpaulo 			return (error);
   2874   1.97    rpaulo 	}
   2875   1.97    rpaulo 
   2876   1.97    rpaulo 	return (0);
   2877   1.97    rpaulo }
   2878   1.97    rpaulo 
   2879   1.97    rpaulo /*
   2880   1.97    rpaulo  * Set a particular packet option, as a sticky option or an ancillary data
   2881   1.97    rpaulo  * item.  "len" can be 0 only when it's a sticky option.
   2882   1.97    rpaulo  * We have 4 cases of combination of "sticky" and "cmsg":
   2883   1.97    rpaulo  * "sticky=0, cmsg=0": impossible
   2884   1.97    rpaulo  * "sticky=0, cmsg=1": RFC2292 or RFC3542 ancillary data
   2885   1.97    rpaulo  * "sticky=1, cmsg=0": RFC3542 socket option
   2886   1.97    rpaulo  * "sticky=1, cmsg=1": RFC2292 socket option
   2887   1.97    rpaulo  */
   2888   1.97    rpaulo static int
   2889   1.97    rpaulo ip6_setpktopt(int optname, u_char *buf, int len, struct ip6_pktopts *opt,
   2890   1.97    rpaulo     int priv, int sticky, int cmsg, int uproto)
   2891   1.97    rpaulo {
   2892   1.97    rpaulo 	int minmtupolicy;
   2893   1.97    rpaulo 
   2894   1.97    rpaulo 	if (!sticky && !cmsg) {
   2895   1.97    rpaulo #ifdef DIAGNOSTIC
   2896   1.97    rpaulo 		printf("ip6_setpktopt: impossible case\n");
   2897   1.97    rpaulo #endif
   2898   1.97    rpaulo 		return (EINVAL);
   2899   1.97    rpaulo 	}
   2900   1.97    rpaulo 
   2901   1.97    rpaulo 	/*
   2902   1.97    rpaulo 	 * IPV6_2292xxx is for backward compatibility to RFC2292, and should
   2903   1.97    rpaulo 	 * not be specified in the context of RFC3542.  Conversely,
   2904   1.97    rpaulo 	 * RFC3542 types should not be specified in the context of RFC2292.
   2905   1.97    rpaulo 	 */
   2906   1.97    rpaulo 	if (!cmsg) {
   2907   1.97    rpaulo 		switch (optname) {
   2908   1.97    rpaulo 		case IPV6_2292PKTINFO:
   2909   1.97    rpaulo 		case IPV6_2292HOPLIMIT:
   2910   1.97    rpaulo 		case IPV6_2292NEXTHOP:
   2911   1.97    rpaulo 		case IPV6_2292HOPOPTS:
   2912   1.97    rpaulo 		case IPV6_2292DSTOPTS:
   2913   1.97    rpaulo 		case IPV6_2292RTHDR:
   2914   1.97    rpaulo 		case IPV6_2292PKTOPTIONS:
   2915   1.97    rpaulo 			return (ENOPROTOOPT);
   2916   1.97    rpaulo 		}
   2917   1.97    rpaulo 	}
   2918   1.97    rpaulo 	if (sticky && cmsg) {
   2919   1.97    rpaulo 		switch (optname) {
   2920    1.2    itojun 		case IPV6_PKTINFO:
   2921   1.97    rpaulo 		case IPV6_HOPLIMIT:
   2922   1.97    rpaulo 		case IPV6_NEXTHOP:
   2923   1.97    rpaulo 		case IPV6_HOPOPTS:
   2924   1.97    rpaulo 		case IPV6_DSTOPTS:
   2925   1.97    rpaulo 		case IPV6_RTHDRDSTOPTS:
   2926   1.97    rpaulo 		case IPV6_RTHDR:
   2927   1.97    rpaulo 		case IPV6_USE_MIN_MTU:
   2928   1.97    rpaulo 		case IPV6_DONTFRAG:
   2929   1.97    rpaulo 		case IPV6_OTCLASS:
   2930   1.97    rpaulo 		case IPV6_TCLASS:
   2931   1.97    rpaulo 			return (ENOPROTOOPT);
   2932   1.97    rpaulo 		}
   2933   1.97    rpaulo 	}
   2934   1.97    rpaulo 
   2935   1.97    rpaulo 	switch (optname) {
   2936   1.97    rpaulo #ifdef RFC2292
   2937   1.97    rpaulo 	case IPV6_2292PKTINFO:
   2938   1.97    rpaulo #endif
   2939   1.97    rpaulo 	case IPV6_PKTINFO:
   2940   1.97    rpaulo 	{
   2941   1.97    rpaulo 		struct ifnet *ifp = NULL;
   2942   1.97    rpaulo 		struct in6_pktinfo *pktinfo;
   2943   1.97    rpaulo 
   2944   1.97    rpaulo 		if (len != sizeof(struct in6_pktinfo))
   2945   1.97    rpaulo 			return (EINVAL);
   2946   1.97    rpaulo 
   2947   1.97    rpaulo 		pktinfo = (struct in6_pktinfo *)buf;
   2948   1.97    rpaulo 
   2949   1.97    rpaulo 		/*
   2950   1.97    rpaulo 		 * An application can clear any sticky IPV6_PKTINFO option by
   2951   1.97    rpaulo 		 * doing a "regular" setsockopt with ipi6_addr being
   2952   1.97    rpaulo 		 * in6addr_any and ipi6_ifindex being zero.
   2953   1.97    rpaulo 		 * [RFC 3542, Section 6]
   2954   1.97    rpaulo 		 */
   2955   1.97    rpaulo 		if (optname == IPV6_PKTINFO && opt->ip6po_pktinfo &&
   2956   1.97    rpaulo 		    pktinfo->ipi6_ifindex == 0 &&
   2957   1.97    rpaulo 		    IN6_IS_ADDR_UNSPECIFIED(&pktinfo->ipi6_addr)) {
   2958   1.97    rpaulo 			ip6_clearpktopts(opt, optname);
   2959   1.97    rpaulo 			break;
   2960   1.97    rpaulo 		}
   2961   1.97    rpaulo 
   2962   1.97    rpaulo 		if (uproto == IPPROTO_TCP && optname == IPV6_PKTINFO &&
   2963   1.97    rpaulo 		    sticky && !IN6_IS_ADDR_UNSPECIFIED(&pktinfo->ipi6_addr)) {
   2964   1.97    rpaulo 			return (EINVAL);
   2965   1.97    rpaulo 		}
   2966   1.97    rpaulo 
   2967   1.97    rpaulo 		/* validate the interface index if specified. */
   2968  1.102  christos 		if (pktinfo->ipi6_ifindex >= if_indexlim) {
   2969   1.97    rpaulo 			 return (ENXIO);
   2970   1.97    rpaulo 		}
   2971   1.97    rpaulo 		if (pktinfo->ipi6_ifindex) {
   2972   1.97    rpaulo 			ifp = ifindex2ifnet[pktinfo->ipi6_ifindex];
   2973   1.97    rpaulo 			if (ifp == NULL)
   2974   1.57    itojun 				return (ENXIO);
   2975   1.97    rpaulo 		}
   2976   1.97    rpaulo 
   2977   1.97    rpaulo 		/*
   2978   1.97    rpaulo 		 * We store the address anyway, and let in6_selectsrc()
   2979   1.97    rpaulo 		 * validate the specified address.  This is because ipi6_addr
   2980   1.97    rpaulo 		 * may not have enough information about its scope zone, and
   2981   1.97    rpaulo 		 * we may need additional information (such as outgoing
   2982   1.97    rpaulo 		 * interface or the scope zone of a destination address) to
   2983   1.97    rpaulo 		 * disambiguate the scope.
   2984   1.97    rpaulo 		 * XXX: the delay of the validation may confuse the
   2985   1.97    rpaulo 		 * application when it is used as a sticky option.
   2986   1.97    rpaulo 		 */
   2987   1.97    rpaulo 		if (opt->ip6po_pktinfo == NULL) {
   2988   1.97    rpaulo 			opt->ip6po_pktinfo = malloc(sizeof(*pktinfo),
   2989   1.97    rpaulo 			    M_IP6OPT, M_NOWAIT);
   2990   1.97    rpaulo 			if (opt->ip6po_pktinfo == NULL)
   2991   1.97    rpaulo 				return (ENOBUFS);
   2992   1.97    rpaulo 		}
   2993   1.97    rpaulo 		memcpy(opt->ip6po_pktinfo, pktinfo, sizeof(*pktinfo));
   2994   1.97    rpaulo 		break;
   2995   1.97    rpaulo 	}
   2996   1.97    rpaulo 
   2997   1.97    rpaulo #ifdef RFC2292
   2998   1.97    rpaulo 	case IPV6_2292HOPLIMIT:
   2999   1.97    rpaulo #endif
   3000   1.97    rpaulo 	case IPV6_HOPLIMIT:
   3001   1.97    rpaulo 	{
   3002   1.97    rpaulo 		int *hlimp;
   3003   1.97    rpaulo 
   3004   1.97    rpaulo 		/*
   3005   1.97    rpaulo 		 * RFC 3542 deprecated the usage of sticky IPV6_HOPLIMIT
   3006   1.97    rpaulo 		 * to simplify the ordering among hoplimit options.
   3007   1.97    rpaulo 		 */
   3008   1.97    rpaulo 		if (optname == IPV6_HOPLIMIT && sticky)
   3009   1.97    rpaulo 			return (ENOPROTOOPT);
   3010   1.97    rpaulo 
   3011   1.97    rpaulo 		if (len != sizeof(int))
   3012   1.97    rpaulo 			return (EINVAL);
   3013   1.97    rpaulo 		hlimp = (int *)buf;
   3014   1.97    rpaulo 		if (*hlimp < -1 || *hlimp > 255)
   3015   1.97    rpaulo 			return (EINVAL);
   3016   1.97    rpaulo 
   3017   1.97    rpaulo 		opt->ip6po_hlim = *hlimp;
   3018   1.97    rpaulo 		break;
   3019   1.97    rpaulo 	}
   3020   1.97    rpaulo 
   3021   1.97    rpaulo 	case IPV6_OTCLASS:
   3022   1.97    rpaulo 		if (len != sizeof(u_int8_t))
   3023   1.97    rpaulo 			return (EINVAL);
   3024   1.97    rpaulo 
   3025   1.97    rpaulo 		opt->ip6po_tclass = *(u_int8_t *)buf;
   3026   1.97    rpaulo 		break;
   3027   1.97    rpaulo 
   3028   1.97    rpaulo 	case IPV6_TCLASS:
   3029   1.97    rpaulo 	{
   3030   1.97    rpaulo 		int tclass;
   3031   1.97    rpaulo 
   3032   1.97    rpaulo 		if (len != sizeof(int))
   3033   1.97    rpaulo 			return (EINVAL);
   3034   1.97    rpaulo 		tclass = *(int *)buf;
   3035   1.97    rpaulo 		if (tclass < -1 || tclass > 255)
   3036   1.97    rpaulo 			return (EINVAL);
   3037    1.2    itojun 
   3038   1.97    rpaulo 		opt->ip6po_tclass = tclass;
   3039   1.97    rpaulo 		break;
   3040   1.97    rpaulo 	}
   3041   1.94    rpaulo 
   3042   1.97    rpaulo #ifdef RFC2292
   3043   1.97    rpaulo 	case IPV6_2292NEXTHOP:
   3044   1.97    rpaulo #endif
   3045   1.97    rpaulo 	case IPV6_NEXTHOP:
   3046   1.97    rpaulo 		if (!priv)
   3047   1.97    rpaulo 			return (EPERM);
   3048   1.35    itojun 
   3049   1.97    rpaulo 		if (len == 0) {	/* just remove the option */
   3050   1.97    rpaulo 			ip6_clearpktopts(opt, IPV6_NEXTHOP);
   3051    1.2    itojun 			break;
   3052   1.97    rpaulo 		}
   3053   1.97    rpaulo 
   3054   1.97    rpaulo 		/* check if cmsg_len is large enough for sa_len */
   3055   1.97    rpaulo 		if (len < sizeof(struct sockaddr) || len < *buf)
   3056   1.97    rpaulo 			return (EINVAL);
   3057   1.97    rpaulo 
   3058   1.97    rpaulo 		switch (((struct sockaddr *)buf)->sa_family) {
   3059   1.97    rpaulo 		case AF_INET6:
   3060   1.97    rpaulo 		{
   3061   1.97    rpaulo 			struct sockaddr_in6 *sa6 = (struct sockaddr_in6 *)buf;
   3062   1.97    rpaulo 			int error;
   3063    1.2    itojun 
   3064   1.97    rpaulo 			if (sa6->sin6_len != sizeof(struct sockaddr_in6))
   3065   1.57    itojun 				return (EINVAL);
   3066    1.2    itojun 
   3067   1.97    rpaulo 			if (IN6_IS_ADDR_UNSPECIFIED(&sa6->sin6_addr) ||
   3068   1.97    rpaulo 			    IN6_IS_ADDR_MULTICAST(&sa6->sin6_addr)) {
   3069   1.97    rpaulo 				return (EINVAL);
   3070   1.97    rpaulo 			}
   3071   1.97    rpaulo 			if ((error = sa6_embedscope(sa6, ip6_use_defzone))
   3072   1.97    rpaulo 			    != 0) {
   3073   1.97    rpaulo 				return (error);
   3074   1.67    itojun 			}
   3075    1.2    itojun 			break;
   3076   1.97    rpaulo 		}
   3077   1.97    rpaulo 		case AF_LINK:	/* eventually be supported? */
   3078   1.97    rpaulo 		default:
   3079   1.97    rpaulo 			return (EAFNOSUPPORT);
   3080   1.97    rpaulo 		}
   3081    1.2    itojun 
   3082   1.97    rpaulo 		/* turn off the previous option, then set the new option. */
   3083   1.97    rpaulo 		ip6_clearpktopts(opt, IPV6_NEXTHOP);
   3084   1.97    rpaulo 		opt->ip6po_nexthop = malloc(*buf, M_IP6OPT, M_NOWAIT);
   3085   1.97    rpaulo 		if (opt->ip6po_nexthop == NULL)
   3086   1.97    rpaulo 			return (ENOBUFS);
   3087   1.97    rpaulo 		memcpy(opt->ip6po_nexthop, buf, *buf);
   3088   1.97    rpaulo 		break;
   3089   1.97    rpaulo 
   3090   1.97    rpaulo #ifdef RFC2292
   3091   1.97    rpaulo 	case IPV6_2292HOPOPTS:
   3092   1.97    rpaulo #endif
   3093   1.97    rpaulo 	case IPV6_HOPOPTS:
   3094   1.97    rpaulo 	{
   3095   1.97    rpaulo 		struct ip6_hbh *hbh;
   3096   1.97    rpaulo 		int hbhlen;
   3097   1.97    rpaulo 
   3098   1.97    rpaulo 		/*
   3099   1.97    rpaulo 		 * XXX: We don't allow a non-privileged user to set ANY HbH
   3100   1.97    rpaulo 		 * options, since per-option restriction has too much
   3101   1.97    rpaulo 		 * overhead.
   3102   1.97    rpaulo 		 */
   3103   1.97    rpaulo 		if (!priv)
   3104   1.97    rpaulo 			return (EPERM);
   3105   1.97    rpaulo 
   3106   1.97    rpaulo 		if (len == 0) {
   3107   1.97    rpaulo 			ip6_clearpktopts(opt, IPV6_HOPOPTS);
   3108   1.97    rpaulo 			break;	/* just remove the option */
   3109   1.97    rpaulo 		}
   3110   1.31    itojun 
   3111   1.97    rpaulo 		/* message length validation */
   3112   1.97    rpaulo 		if (len < sizeof(struct ip6_hbh))
   3113   1.97    rpaulo 			return (EINVAL);
   3114   1.97    rpaulo 		hbh = (struct ip6_hbh *)buf;
   3115   1.97    rpaulo 		hbhlen = (hbh->ip6h_len + 1) << 3;
   3116   1.97    rpaulo 		if (len != hbhlen)
   3117   1.97    rpaulo 			return (EINVAL);
   3118    1.2    itojun 
   3119   1.97    rpaulo 		/* turn off the previous option, then set the new option. */
   3120   1.97    rpaulo 		ip6_clearpktopts(opt, IPV6_HOPOPTS);
   3121   1.97    rpaulo 		opt->ip6po_hbh = malloc(hbhlen, M_IP6OPT, M_NOWAIT);
   3122   1.97    rpaulo 		if (opt->ip6po_hbh == NULL)
   3123   1.97    rpaulo 			return (ENOBUFS);
   3124   1.97    rpaulo 		memcpy(opt->ip6po_hbh, hbh, hbhlen);
   3125    1.2    itojun 
   3126   1.97    rpaulo 		break;
   3127   1.97    rpaulo 	}
   3128    1.2    itojun 
   3129   1.97    rpaulo #ifdef RFC2292
   3130   1.97    rpaulo 	case IPV6_2292DSTOPTS:
   3131   1.97    rpaulo #endif
   3132   1.97    rpaulo 	case IPV6_DSTOPTS:
   3133   1.97    rpaulo 	case IPV6_RTHDRDSTOPTS:
   3134   1.97    rpaulo 	{
   3135   1.97    rpaulo 		struct ip6_dest *dest, **newdest = NULL;
   3136   1.97    rpaulo 		int destlen;
   3137   1.67    itojun 
   3138   1.97    rpaulo 		if (!priv)	/* XXX: see the comment for IPV6_HOPOPTS */
   3139   1.97    rpaulo 			return (EPERM);
   3140    1.2    itojun 
   3141   1.97    rpaulo 		if (len == 0) {
   3142   1.97    rpaulo 			ip6_clearpktopts(opt, optname);
   3143   1.97    rpaulo 			break;	/* just remove the option */
   3144   1.97    rpaulo 		}
   3145    1.2    itojun 
   3146   1.97    rpaulo 		/* message length validation */
   3147   1.97    rpaulo 		if (len < sizeof(struct ip6_dest))
   3148   1.97    rpaulo 			return (EINVAL);
   3149   1.97    rpaulo 		dest = (struct ip6_dest *)buf;
   3150   1.97    rpaulo 		destlen = (dest->ip6d_len + 1) << 3;
   3151   1.97    rpaulo 		if (len != destlen)
   3152   1.97    rpaulo 			return (EINVAL);
   3153   1.97    rpaulo 		/*
   3154   1.97    rpaulo 		 * Determine the position that the destination options header
   3155   1.97    rpaulo 		 * should be inserted; before or after the routing header.
   3156   1.97    rpaulo 		 */
   3157   1.97    rpaulo 		switch (optname) {
   3158   1.97    rpaulo 		case IPV6_2292DSTOPTS:
   3159    1.2    itojun 			/*
   3160   1.97    rpaulo 			 * The old advanced API is ambiguous on this point.
   3161   1.97    rpaulo 			 * Our approach is to determine the position
   3162   1.97    rpaulo 			 * according to the existence of a routing header.
   3163   1.97    rpaulo 			 * Note, however, that this depends on the order of the
   3164   1.97    rpaulo 			 * extension headers in the ancillary data; the 1st
   3165   1.97    rpaulo 			 * part of the destination options header must appear
   3166   1.97    rpaulo 			 * before the routing header in the ancillary data,
   3167   1.97    rpaulo 			 * too.
   3168   1.97    rpaulo 			 * RFC3542 solved the ambiguity by introducing
   3169   1.97    rpaulo 			 * separate ancillary data or option types.
   3170    1.2    itojun 			 */
   3171   1.97    rpaulo 			if (opt->ip6po_rthdr == NULL)
   3172   1.97    rpaulo 				newdest = &opt->ip6po_dest1;
   3173   1.97    rpaulo 			else
   3174   1.97    rpaulo 				newdest = &opt->ip6po_dest2;
   3175   1.97    rpaulo 			break;
   3176   1.97    rpaulo 		case IPV6_RTHDRDSTOPTS:
   3177   1.97    rpaulo 			newdest = &opt->ip6po_dest1;
   3178   1.97    rpaulo 			break;
   3179   1.97    rpaulo 		case IPV6_DSTOPTS:
   3180   1.97    rpaulo 			newdest = &opt->ip6po_dest2;
   3181   1.97    rpaulo 			break;
   3182   1.97    rpaulo 		}
   3183   1.97    rpaulo 
   3184   1.97    rpaulo 		/* turn off the previous option, then set the new option. */
   3185   1.97    rpaulo 		ip6_clearpktopts(opt, optname);
   3186   1.97    rpaulo 		*newdest = malloc(destlen, M_IP6OPT, M_NOWAIT);
   3187   1.97    rpaulo 		if (*newdest == NULL)
   3188   1.97    rpaulo 			return (ENOBUFS);
   3189   1.97    rpaulo 		memcpy(*newdest, dest, destlen);
   3190   1.67    itojun 
   3191   1.97    rpaulo 		break;
   3192   1.97    rpaulo 	}
   3193   1.97    rpaulo 
   3194   1.97    rpaulo #ifdef RFC2292
   3195   1.97    rpaulo 	case IPV6_2292RTHDR:
   3196   1.97    rpaulo #endif
   3197   1.97    rpaulo 	case IPV6_RTHDR:
   3198   1.97    rpaulo 	{
   3199   1.97    rpaulo 		struct ip6_rthdr *rth;
   3200   1.97    rpaulo 		int rthlen;
   3201   1.97    rpaulo 
   3202   1.97    rpaulo 		if (len == 0) {
   3203   1.97    rpaulo 			ip6_clearpktopts(opt, IPV6_RTHDR);
   3204   1.97    rpaulo 			break;	/* just remove the option */
   3205   1.97    rpaulo 		}
   3206    1.2    itojun 
   3207   1.97    rpaulo 		/* message length validation */
   3208   1.97    rpaulo 		if (len < sizeof(struct ip6_rthdr))
   3209   1.97    rpaulo 			return (EINVAL);
   3210   1.97    rpaulo 		rth = (struct ip6_rthdr *)buf;
   3211   1.97    rpaulo 		rthlen = (rth->ip6r_len + 1) << 3;
   3212   1.97    rpaulo 		if (len != rthlen)
   3213   1.97    rpaulo 			return (EINVAL);
   3214   1.97    rpaulo 		switch (rth->ip6r_type) {
   3215   1.97    rpaulo 		case IPV6_RTHDR_TYPE_0:
   3216   1.97    rpaulo 			if (rth->ip6r_len == 0)	/* must contain one addr */
   3217   1.97    rpaulo 				return (EINVAL);
   3218   1.97    rpaulo 			if (rth->ip6r_len % 2) /* length must be even */
   3219   1.97    rpaulo 				return (EINVAL);
   3220   1.97    rpaulo 			if (rth->ip6r_len / 2 != rth->ip6r_segleft)
   3221   1.57    itojun 				return (EINVAL);
   3222    1.2    itojun 			break;
   3223    1.2    itojun 		default:
   3224   1.97    rpaulo 			return (EINVAL);	/* not supported */
   3225    1.2    itojun 		}
   3226   1.97    rpaulo 		/* turn off the previous option */
   3227   1.97    rpaulo 		ip6_clearpktopts(opt, IPV6_RTHDR);
   3228   1.97    rpaulo 		opt->ip6po_rthdr = malloc(rthlen, M_IP6OPT, M_NOWAIT);
   3229   1.97    rpaulo 		if (opt->ip6po_rthdr == NULL)
   3230   1.97    rpaulo 			return (ENOBUFS);
   3231   1.97    rpaulo 		memcpy(opt->ip6po_rthdr, rth, rthlen);
   3232   1.97    rpaulo 		break;
   3233    1.2    itojun 	}
   3234    1.2    itojun 
   3235   1.97    rpaulo 	case IPV6_USE_MIN_MTU:
   3236   1.97    rpaulo 		if (len != sizeof(int))
   3237   1.97    rpaulo 			return (EINVAL);
   3238   1.97    rpaulo 		minmtupolicy = *(int *)buf;
   3239   1.97    rpaulo 		if (minmtupolicy != IP6PO_MINMTU_MCASTONLY &&
   3240   1.97    rpaulo 		    minmtupolicy != IP6PO_MINMTU_DISABLE &&
   3241   1.97    rpaulo 		    minmtupolicy != IP6PO_MINMTU_ALL) {
   3242   1.97    rpaulo 			return (EINVAL);
   3243   1.97    rpaulo 		}
   3244   1.97    rpaulo 		opt->ip6po_minmtu = minmtupolicy;
   3245   1.97    rpaulo 		break;
   3246   1.97    rpaulo 
   3247   1.97    rpaulo 	case IPV6_DONTFRAG:
   3248   1.97    rpaulo 		if (len != sizeof(int))
   3249   1.97    rpaulo 			return (EINVAL);
   3250   1.97    rpaulo 
   3251   1.97    rpaulo 		if (uproto == IPPROTO_TCP || *(int *)buf == 0) {
   3252   1.97    rpaulo 			/*
   3253   1.97    rpaulo 			 * we ignore this option for TCP sockets.
   3254   1.97    rpaulo 			 * (RFC3542 leaves this case unspecified.)
   3255   1.97    rpaulo 			 */
   3256   1.97    rpaulo 			opt->ip6po_flags &= ~IP6PO_DONTFRAG;
   3257   1.97    rpaulo 		} else
   3258   1.97    rpaulo 			opt->ip6po_flags |= IP6PO_DONTFRAG;
   3259   1.97    rpaulo 		break;
   3260   1.97    rpaulo 
   3261   1.97    rpaulo 	default:
   3262   1.97    rpaulo 		return (ENOPROTOOPT);
   3263   1.97    rpaulo 	} /* end of switch */
   3264   1.97    rpaulo 
   3265   1.57    itojun 	return (0);
   3266    1.2    itojun }
   3267    1.2    itojun 
   3268    1.2    itojun /*
   3269    1.2    itojun  * Routine called from ip6_output() to loop back a copy of an IP6 multicast
   3270    1.2    itojun  * packet to the input queue of a specified interface.  Note that this
   3271    1.2    itojun  * calls the output routine of the loopback "driver", but with an interface
   3272   1.86     peter  * pointer that might NOT be lo0ifp -- easier than replicating that code here.
   3273    1.2    itojun  */
   3274    1.2    itojun void
   3275  1.119  christos ip6_mloopback(struct ifnet *ifp, struct mbuf *m,
   3276  1.119  christos 	const struct sockaddr_in6 *dst)
   3277    1.2    itojun {
   3278   1.22    itojun 	struct mbuf *copym;
   3279   1.22    itojun 	struct ip6_hdr *ip6;
   3280    1.2    itojun 
   3281    1.2    itojun 	copym = m_copy(m, 0, M_COPYALL);
   3282   1.22    itojun 	if (copym == NULL)
   3283   1.22    itojun 		return;
   3284   1.22    itojun 
   3285   1.22    itojun 	/*
   3286   1.22    itojun 	 * Make sure to deep-copy IPv6 header portion in case the data
   3287   1.22    itojun 	 * is in an mbuf cluster, so that we can safely override the IPv6
   3288   1.22    itojun 	 * header portion later.
   3289   1.22    itojun 	 */
   3290   1.22    itojun 	if ((copym->m_flags & M_EXT) != 0 ||
   3291   1.22    itojun 	    copym->m_len < sizeof(struct ip6_hdr)) {
   3292   1.22    itojun 		copym = m_pullup(copym, sizeof(struct ip6_hdr));
   3293   1.22    itojun 		if (copym == NULL)
   3294   1.22    itojun 			return;
   3295   1.22    itojun 	}
   3296   1.22    itojun 
   3297   1.22    itojun #ifdef DIAGNOSTIC
   3298   1.22    itojun 	if (copym->m_len < sizeof(*ip6)) {
   3299   1.22    itojun 		m_freem(copym);
   3300   1.22    itojun 		return;
   3301   1.22    itojun 	}
   3302   1.22    itojun #endif
   3303   1.22    itojun 
   3304   1.34    itojun 	ip6 = mtod(copym, struct ip6_hdr *);
   3305   1.94    rpaulo 	/*
   3306   1.94    rpaulo 	 * clear embedded scope identifiers if necessary.
   3307   1.94    rpaulo 	 * in6_clearscope will touch the addresses only when necessary.
   3308   1.94    rpaulo 	 */
   3309   1.94    rpaulo 	in6_clearscope(&ip6->ip6_src);
   3310   1.94    rpaulo 	in6_clearscope(&ip6->ip6_dst);
   3311   1.22    itojun 
   3312  1.115    dyoung 	(void)looutput(ifp, copym, (const struct sockaddr *)dst, NULL);
   3313    1.2    itojun }
   3314    1.2    itojun 
   3315    1.2    itojun /*
   3316    1.2    itojun  * Chop IPv6 header off from the payload.
   3317    1.2    itojun  */
   3318    1.2    itojun static int
   3319  1.119  christos ip6_splithdr(struct mbuf *m,  struct ip6_exthdrs *exthdrs)
   3320    1.2    itojun {
   3321    1.2    itojun 	struct mbuf *mh;
   3322    1.2    itojun 	struct ip6_hdr *ip6;
   3323    1.2    itojun 
   3324    1.2    itojun 	ip6 = mtod(m, struct ip6_hdr *);
   3325    1.2    itojun 	if (m->m_len > sizeof(*ip6)) {
   3326    1.2    itojun 		MGETHDR(mh, M_DONTWAIT, MT_HEADER);
   3327    1.2    itojun 		if (mh == 0) {
   3328    1.2    itojun 			m_freem(m);
   3329    1.2    itojun 			return ENOBUFS;
   3330    1.2    itojun 		}
   3331   1.91      yamt 		M_MOVE_PKTHDR(mh, m);
   3332    1.2    itojun 		MH_ALIGN(mh, sizeof(*ip6));
   3333    1.2    itojun 		m->m_len -= sizeof(*ip6);
   3334    1.2    itojun 		m->m_data += sizeof(*ip6);
   3335    1.2    itojun 		mh->m_next = m;
   3336    1.2    itojun 		m = mh;
   3337    1.2    itojun 		m->m_len = sizeof(*ip6);
   3338  1.117  christos 		bcopy((void *)ip6, mtod(m, void *), sizeof(*ip6));
   3339    1.2    itojun 	}
   3340    1.2    itojun 	exthdrs->ip6e_ip6 = m;
   3341    1.2    itojun 	return 0;
   3342    1.2    itojun }
   3343    1.2    itojun 
   3344    1.2    itojun /*
   3345    1.2    itojun  * Compute IPv6 extension header length.
   3346    1.2    itojun  */
   3347    1.2    itojun int
   3348  1.119  christos ip6_optlen(struct in6pcb *in6p)
   3349    1.2    itojun {
   3350    1.2    itojun 	int len;
   3351    1.2    itojun 
   3352    1.2    itojun 	if (!in6p->in6p_outputopts)
   3353    1.2    itojun 		return 0;
   3354    1.2    itojun 
   3355    1.2    itojun 	len = 0;
   3356    1.2    itojun #define elen(x) \
   3357    1.2    itojun     (((struct ip6_ext *)(x)) ? (((struct ip6_ext *)(x))->ip6e_len + 1) << 3 : 0)
   3358    1.2    itojun 
   3359    1.2    itojun 	len += elen(in6p->in6p_outputopts->ip6po_hbh);
   3360    1.2    itojun 	len += elen(in6p->in6p_outputopts->ip6po_dest1);
   3361    1.2    itojun 	len += elen(in6p->in6p_outputopts->ip6po_rthdr);
   3362    1.2    itojun 	len += elen(in6p->in6p_outputopts->ip6po_dest2);
   3363    1.2    itojun 	return len;
   3364    1.2    itojun #undef elen
   3365    1.2    itojun }
   3366