Home | History | Annotate | Line # | Download | only in libsockin
sockin.c revision 1.10
      1 /*	$NetBSD: sockin.c,v 1.10 2009/01/26 13:44:51 pooka Exp $	*/
      2 
      3 /*
      4  * Copyright (c) 2008, 2009 Antti Kantee.  All Rights Reserved.
      5  *
      6  * Redistribution and use in source and binary forms, with or without
      7  * modification, are permitted provided that the following conditions
      8  * are met:
      9  * 1. Redistributions of source code must retain the above copyright
     10  *    notice, this list of conditions and the following disclaimer.
     11  * 2. Redistributions in binary form must reproduce the above copyright
     12  *    notice, this list of conditions and the following disclaimer in the
     13  *    documentation and/or other materials provided with the distribution.
     14  *
     15  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS
     16  * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
     17  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
     18  * DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
     19  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     20  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
     21  * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     22  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     23  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     24  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     25  * SUCH DAMAGE.
     26  */
     27 
     28 #include <sys/cdefs.h>
     29 __KERNEL_RCSID(0, "$NetBSD: sockin.c,v 1.10 2009/01/26 13:44:51 pooka Exp $");
     30 
     31 #include <sys/param.h>
     32 #include <sys/condvar.h>
     33 #include <sys/domain.h>
     34 #include <sys/kmem.h>
     35 #include <sys/kthread.h>
     36 #include <sys/mbuf.h>
     37 #include <sys/mutex.h>
     38 #include <sys/poll.h>
     39 #include <sys/protosw.h>
     40 #include <sys/queue.h>
     41 #include <sys/socket.h>
     42 #include <sys/socketvar.h>
     43 #include <sys/time.h>
     44 
     45 #include <net/radix.h>
     46 
     47 #include <netinet/in.h>
     48 #include <netinet/in_systm.h>
     49 #include <netinet/ip.h>
     50 
     51 #include <rump/rumpuser.h>
     52 
     53 #include "rump_private.h"
     54 
/*
 * An inet communication domain which uses the socket interface.
 * Currently supports IPv4 UDP and TCP, but could easily be extended
 * to support IPv6 by adding more stuff to the protosw.
 */
     60 
/*
 * DOMAIN_DEFINE comes from the kernel headers and is not visible here;
 * presumably it declares/registers sockindomain -- TODO confirm.  The
 * domain object itself is defined further down in this file.
 */
DOMAIN_DEFINE(sockindomain);

/*
 * Handlers referenced by the sockinsw[] and sockindomain initializers
 * below; all three are defined later in this file.
 */
static void	sockin_init(void);
static int	sockin_usrreq(struct socket *, int, struct mbuf *,
			      struct mbuf *, struct mbuf *, struct lwp *);
static int	sockin_ctloutput(int op, struct socket *, struct sockopt *);
     67 
/*
 * Protocol switch for the domain: one datagram (UDP) entry and one
 * stream (TCP) entry.  Both entries route user requests and socket
 * option calls to the same pair of handlers.
 */
const struct protosw sockinsw[] = {
{
	.pr_type = SOCK_DGRAM,
	.pr_domain = &sockindomain,
	.pr_protocol = IPPROTO_UDP,
	.pr_flags = PR_ATOMIC|PR_ADDR,
	.pr_usrreq = sockin_usrreq,
	.pr_ctloutput = sockin_ctloutput,
},
{
	.pr_type = SOCK_STREAM,
	.pr_domain = &sockindomain,
	.pr_protocol = IPPROTO_TCP,
	.pr_flags = PR_CONNREQUIRED|PR_WANTRCVD|PR_LISTEN|PR_ABRTACPTDIS,
	.pr_usrreq = sockin_usrreq,
	.pr_ctloutput = sockin_ctloutput,
}};
     85 
/*
 * Domain descriptor for PF_INET.  It points at the sockinsw[] table
 * above and uses sockin_init() as its init hook.
 */
struct domain sockindomain = {
	.dom_family = PF_INET,
	.dom_name = "socket_inet",
	.dom_init = sockin_init,
	.dom_externalize = NULL,
	.dom_dispose = NULL,
	.dom_protosw = sockinsw,
	/* end marker: address one past the last sockinsw[] entry */
	.dom_protoswNPROTOSW = &sockinsw[__arraycount(sockinsw)],
	.dom_rtattach = rn_inithead,
	.dom_rtoffset = 32,
	.dom_maxrtkey = sizeof(struct sockaddr_in),
	.dom_ifattach = NULL,
	.dom_ifdetach = NULL,
	.dom_ifqueues = { NULL },
	.dom_link = { NULL },
	.dom_mowner = MOWNER_INIT("",""),
	.dom_rtcache = { NULL },
	.dom_sockaddr_cmp = NULL
};
    105 
/*
 * SO2S: fetch the host socket descriptor that registersock() stashed in
 * so_internal.  The argument is parenthesized so that any pointer
 * expression can be passed, not only a plain identifier.
 */
#define SO2S(so) ((intptr_t)((so)->so_internal))
/* Buffer size handed to soreserve() for both directions in PRU_ATTACH. */
#define SOCKIN_SBSIZE 65536
    108 
/* One list node per socket tracked by this domain. */
struct sockin_unit {
	struct socket *su_so;	/* the kernel socket this node stands for */

	LIST_ENTRY(sockin_unit) su_entries;	/* linkage on su_ent */
};
/* All registered sockets; insertions and removals happen under su_mtx. */
static LIST_HEAD(, sockin_unit) su_ent = LIST_HEAD_INITIALIZER(su_ent);
/* Guards su_ent and nsock; every write to rebuild is also done under it. */
static kmutex_t su_mtx;
/* Set whenever su_ent changes; cleared by sockinworker once it has
 * regenerated its pollfd array. */
static bool rebuild;
/* Number of nodes currently on su_ent. */
static int nsock;
    118 
    119 static int
    120 registersock(struct socket *so, int news)
    121 {
    122 	struct sockin_unit *su;
    123 
    124 	su = kmem_alloc(sizeof(*su), KM_NOSLEEP);
    125 	if (!su)
    126 		return ENOMEM;
    127 
    128 	so->so_internal = (void *)(intptr_t)news;
    129 	su->su_so = so;
    130 
    131 	mutex_enter(&su_mtx);
    132 	LIST_INSERT_HEAD(&su_ent, su, su_entries);
    133 	nsock++;
    134 	rebuild = true;
    135 	mutex_exit(&su_mtx);
    136 
    137 	return 0;
    138 }
    139 
    140 static void
    141 removesock(struct socket *so)
    142 {
    143 	struct sockin_unit *su_iter;
    144 	int error;
    145 
    146 	mutex_enter(&su_mtx);
    147 	LIST_FOREACH(su_iter, &su_ent, su_entries) {
    148 		if (su_iter->su_so == so)
    149 			break;
    150 	}
    151 	if (!su_iter)
    152 		panic("no such socket");
    153 
    154 	LIST_REMOVE(su_iter, su_entries);
    155 	nsock--;
    156 	rebuild = true;
    157 	mutex_exit(&su_mtx);
    158 
    159 	rumpuser_close(SO2S(su_iter->su_so), &error);
    160 	kmem_free(su_iter, sizeof(*su_iter));
    161 }
    162 
    163 static void
    164 sockin_process(struct socket *so)
    165 {
    166 	struct sockaddr_in from;
    167 	struct iovec io;
    168 	struct msghdr rmsg;
    169 	struct mbuf *m;
    170 	ssize_t n;
    171 	size_t plen;
    172 	int error;
    173 
    174 	plen = IP_MAXPACKET;
    175 	m = m_gethdr(M_WAIT, MT_DATA);
    176 	MEXTMALLOC(m, plen, M_WAIT);
    177 
    178 	memset(&rmsg, 0, sizeof(rmsg));
    179 	io.iov_base = mtod(m, void *);
    180 	io.iov_len = plen;
    181 	rmsg.msg_iov = &io;
    182 	rmsg.msg_iovlen = 1;
    183 	rmsg.msg_name = (struct sockaddr *)&from;
    184 	rmsg.msg_namelen = sizeof(from);
    185 
    186 	n = rumpuser_net_recvmsg(SO2S(so), &rmsg, 0, &error);
    187 	if (n <= 0) {
    188 		m_freem(m);
    189 
    190 		/* Treat a TCP socket a goner */
    191 		if (so->so_proto->pr_type == SOCK_STREAM && error != EAGAIN) {
    192 			soisdisconnected(so);
    193 			removesock(so);
    194 		}
    195 		return;
    196 	}
    197 	m->m_len = m->m_pkthdr.len = n;
    198 
    199 	if (so->so_proto->pr_type == SOCK_DGRAM) {
    200 		if (!sbappendaddr(&so->so_rcv, rmsg.msg_name, m, NULL)) {
    201 			m_freem(m);
    202 		}
    203 	} else {
    204 		sbappendstream(&so->so_rcv, m);
    205 	}
    206 
    207 	sorwakeup(so);
    208 }
    209 
    210 static void
    211 sockin_accept(struct socket *so)
    212 {
    213 	struct socket *nso;
    214 	struct sockaddr_in sin;
    215 	int news, error, slen;
    216 
    217 	slen = sizeof(sin);
    218 	news = rumpuser_net_accept(SO2S(so), (struct sockaddr *)&sin,
    219 	    &slen, &error);
    220 	if (news == -1)
    221 		return;
    222 
    223 	if ((nso = sonewconn(so, SS_ISCONNECTED)) == NULL)
    224 		goto errout;
    225 	if (registersock(nso, news) != 0)
    226 		goto errout;
    227 	return;
    228 
    229  errout:
    230 	rumpuser_close(news, &error);
    231 	if (nso)
    232 		soclose(nso);
    233 }
    234 
    235 #define POLLTIMEOUT 100	/* check for new entries every 100ms */
    236 
    237 /* XXX: doesn't handle socket (kernel) locking properly? */
    238 static void
    239 sockinworker(void *arg)
    240 {
    241 	struct pollfd *pfds = NULL, *npfds;
    242 	struct sockin_unit *su_iter;
    243 	struct socket *so;
    244 	int cursock = 0, i, rv, error;
    245 
    246 	/*
    247 	 * Loop reading requests.  Check for new sockets periodically
    248 	 * (could be smarter, but I'm lazy).
    249 	 */
    250 	for (;;) {
    251 		if (rebuild) {
    252 			npfds = NULL;
    253 			mutex_enter(&su_mtx);
    254 			if (nsock)
    255 				npfds = kmem_alloc(nsock * sizeof(*npfds),
    256 				    KM_NOSLEEP);
    257 			if (npfds || nsock == 0) {
    258 				if (pfds)
    259 					kmem_free(pfds, cursock*sizeof(*pfds));
    260 				pfds = npfds;
    261 				cursock = nsock;
    262 				rebuild = false;
    263 
    264 				i = 0;
    265 				LIST_FOREACH(su_iter, &su_ent, su_entries) {
    266 					pfds[i].fd = SO2S(su_iter->su_so);
    267 					pfds[i].events = POLLIN;
    268 					pfds[i].revents = 0;
    269 					i++;
    270 				}
    271 				KASSERT(i == nsock);
    272 			}
    273 			mutex_exit(&su_mtx);
    274 		}
    275 
    276 		/* find affected sockets & process */
    277 		rv = rumpuser_poll(pfds, cursock, POLLTIMEOUT, &error);
    278 		for (i = 0; i < cursock && rv > 0; i++) {
    279 			if (pfds[i].revents & POLLIN) {
    280 				mutex_enter(&su_mtx);
    281 				LIST_FOREACH(su_iter, &su_ent, su_entries) {
    282 					if (SO2S(su_iter->su_so)==pfds[i].fd) {
    283 						so = su_iter->su_so;
    284 						mutex_exit(&su_mtx);
    285 						mutex_enter(softnet_lock);
    286 						if(so->so_options&SO_ACCEPTCONN)
    287 							sockin_accept(so);
    288 						else
    289 							sockin_process(so);
    290 						mutex_exit(softnet_lock);
    291 						mutex_enter(&su_mtx);
    292 						break;
    293 					}
    294 				}
    295 				/* if we can't find it, just wing it */
    296 				KASSERT(rebuild || su_iter);
    297 				mutex_exit(&su_mtx);
    298 				pfds[i].revents = 0;
    299 				rv--;
    300 				i = -1;
    301 				continue;
    302 			}
    303 
    304 			/* something else?  ignore */
    305 			if (pfds[i].revents) {
    306 				pfds[i].revents = 0;
    307 				rv--;
    308 			}
    309 		}
    310 		KASSERT(rv <= 0);
    311 	}
    312 
    313 }
    314 
    315 static void
    316 sockin_init()
    317 {
    318 	int rv;
    319 
    320 	if (rump_threads) {
    321 		if ((rv = kthread_create(PRI_NONE, 0, NULL, sockinworker,
    322 		    NULL, NULL, "sockwork")) != 0)
    323 			panic("sockin_init: could not create worker thread\n");
    324 	} else {
    325 		printf("sockin_init: no threads => no worker thread\n");
    326 	}
    327 	mutex_init(&su_mtx, MUTEX_DEFAULT, IPL_NONE);
    328 }
    329 
    330 static int
    331 sockin_usrreq(struct socket *so, int req, struct mbuf *m, struct mbuf *nam,
    332 	struct mbuf *control, struct lwp *l)
    333 {
    334 	int error = 0, rv;
    335 
    336 	switch (req) {
    337 	case PRU_ATTACH:
    338 	{
    339 		int news;
    340 
    341 		sosetlock(so);
    342 		if (so->so_snd.sb_hiwat == 0 || so->so_rcv.sb_hiwat == 0) {
    343 			error = soreserve(so, SOCKIN_SBSIZE, SOCKIN_SBSIZE);
    344 			if (error)
    345 				break;
    346 		}
    347 
    348 		news = rumpuser_net_socket(PF_INET, so->so_proto->pr_type,
    349 		    0, &error);
    350 		if (news == -1)
    351 			break;
    352 
    353 		if ((error = registersock(so, news)) != 0)
    354 			rumpuser_close(news, &error);
    355 
    356 		break;
    357 	}
    358 
    359 	case PRU_ACCEPT:
    360 		/* we do all the work in the worker thread */
    361 		break;
    362 
    363 	case PRU_BIND:
    364 		rumpuser_net_bind(SO2S(so), mtod(nam, const struct sockaddr *),
    365 		    sizeof(struct sockaddr_in), &error);
    366 		break;
    367 
    368 	case PRU_CONNECT:
    369 		/* don't bother to connect udp sockets, always sendmsg */
    370 		if (so->so_proto->pr_type == SOCK_DGRAM)
    371 			break;
    372 
    373 		rv = rumpuser_net_connect(SO2S(so),
    374 		    mtod(nam, struct sockaddr *), sizeof(struct sockaddr_in),
    375 		    &error);
    376 		if (rv == 0)
    377 			soisconnected(so);
    378 		break;
    379 
    380 	case PRU_LISTEN:
    381 		rumpuser_net_listen(SO2S(so), so->so_qlimit, &error);
    382 		break;
    383 
    384 	case PRU_SEND:
    385 	{
    386 		struct sockaddr *saddr;
    387 		struct msghdr mhdr;
    388 		struct iovec iov[16];
    389 		struct mbuf *m2;
    390 		size_t tot;
    391 		int i, s;
    392 
    393 		memset(&mhdr, 0, sizeof(mhdr));
    394 
    395 		tot = 0;
    396 		for (i = 0, m2 = m; m2; m2 = m2->m_next, i++) {
    397 			if (i > 16)
    398 				panic("lazy bum");
    399 			iov[i].iov_base = m2->m_data;
    400 			iov[i].iov_len = m2->m_len;
    401 			tot += m2->m_len;
    402 
    403 		}
    404 		mhdr.msg_iov = iov;
    405 		mhdr.msg_iovlen = i;
    406 		s = SO2S(so);
    407 
    408 		if (so->so_proto->pr_type == SOCK_DGRAM) {
    409 			saddr = mtod(nam, struct sockaddr *);
    410 			mhdr.msg_name = saddr;
    411 			mhdr.msg_namelen = saddr->sa_len;
    412 		}
    413 
    414 		rumpuser_net_sendmsg(s, &mhdr, 0, &error);
    415 
    416 		m_freem(m);
    417 		m_freem(control);
    418 
    419 		/* this assumes too many things to list.. buthey, testing */
    420 		if (!rump_threads)
    421 			sockin_process(so);
    422 	}
    423 		break;
    424 
    425 	case PRU_SHUTDOWN:
    426 		removesock(so);
    427 		break;
    428 
    429 	case PRU_SOCKADDR:
    430 	case PRU_PEERADDR:
    431 	{
    432 		int slen = nam->m_len;
    433 		enum rumpuser_getnametype which;
    434 
    435 		if (req == PRU_SOCKADDR)
    436 			which = RUMPUSER_SOCKNAME;
    437 		else
    438 			which = RUMPUSER_PEERNAME;
    439 		rumpuser_net_getname(SO2S(so),
    440 		    mtod(nam, struct sockaddr *), &slen, which, &error);
    441 		if (error == 0)
    442 			nam->m_len = slen;
    443 		break;
    444 	}
    445 
    446 	default:
    447 		panic("sockin_usrreq: IMPLEMENT ME, req %d not supported", req);
    448 	}
    449 
    450 	return error;
    451 }
    452 
/*
 * Socket option hook shared by both sockinsw[] entries.  Currently a
 * stub: none of the arguments are looked at and success is always
 * reported.
 */
static int
sockin_ctloutput(int op, struct socket *so, struct sockopt *sopt)
{
	/* XXX: we should also do something here */
	return 0;
}
    460