/*	$NetBSD: sockin.c,v 1.54 2014/07/31 03:39:36 rtr Exp $	*/
2
3 /*
4 * Copyright (c) 2008, 2009 Antti Kantee. All Rights Reserved.
5 *
6 * Redistribution and use in source and binary forms, with or without
7 * modification, are permitted provided that the following conditions
8 * are met:
9 * 1. Redistributions of source code must retain the above copyright
10 * notice, this list of conditions and the following disclaimer.
11 * 2. Redistributions in binary form must reproduce the above copyright
12 * notice, this list of conditions and the following disclaimer in the
13 * documentation and/or other materials provided with the distribution.
14 *
15 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS
16 * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
17 * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
18 * DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
19 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
20 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
21 * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
22 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
23 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
24 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
25 * SUCH DAMAGE.
26 */
27
28 #include <sys/cdefs.h>
29 __KERNEL_RCSID(0, "$NetBSD: sockin.c,v 1.54 2014/07/31 03:39:36 rtr Exp $");
30
31 #include <sys/param.h>
32 #include <sys/condvar.h>
33 #include <sys/domain.h>
34 #include <sys/kmem.h>
35 #include <sys/kthread.h>
36 #include <sys/mbuf.h>
37 #include <sys/mutex.h>
38 #include <sys/once.h>
39 #include <sys/poll.h>
40 #include <sys/protosw.h>
41 #include <sys/queue.h>
42 #include <sys/socket.h>
43 #include <sys/socketvar.h>
44 #include <sys/time.h>
45
46 #include <net/bpf.h>
47 #include <net/if.h>
48 #include <net/radix.h>
49
50 #include <netinet/in.h>
51 #include <netinet/in_systm.h>
52 #include <netinet/ip.h>
53
54 #include <rump/rumpuser.h>
55
56 #include "rump_private.h"
57 #include "sockin_user.h"
58
59 /*
60 * An inet communication domain which uses the socket interface.
61 * Supports IPv4 & IPv6 UDP/TCP.
62 */
63
64 DOMAIN_DEFINE(sockindomain);
65 DOMAIN_DEFINE(sockin6domain);
66
67 static int sockin_do_init(void);
68 static void sockin_init(void);
69 static int sockin_attach(struct socket *, int);
70 static void sockin_detach(struct socket *);
71 static int sockin_accept(struct socket *, struct mbuf *);
72 static int sockin_bind(struct socket *, struct mbuf *);
73 static int sockin_listen(struct socket *);
74 static int sockin_connect(struct socket *, struct mbuf *);
75 static int sockin_disconnect(struct socket *);
76 static int sockin_shutdown(struct socket *);
77 static int sockin_abort(struct socket *);
78 static int sockin_ioctl(struct socket *, u_long, void *, struct ifnet *);
79 static int sockin_stat(struct socket *, struct stat *);
80 static int sockin_peeraddr(struct socket *, struct mbuf *);
81 static int sockin_sockaddr(struct socket *, struct mbuf *);
82 static int sockin_recvoob(struct socket *, struct mbuf *, int);
83 static int sockin_sendoob(struct socket *, struct mbuf *, struct mbuf *);
84 static int sockin_usrreq(struct socket *, int, struct mbuf *,
85 struct mbuf *, struct mbuf *, struct lwp *);
86 static int sockin_ctloutput(int op, struct socket *, struct sockopt *);
87
88 static const struct pr_usrreqs sockin_usrreqs = {
89 .pr_attach = sockin_attach,
90 .pr_detach = sockin_detach,
91 .pr_accept = sockin_accept,
92 .pr_bind = sockin_bind,
93 .pr_listen = sockin_listen,
94 .pr_connect = sockin_connect,
95 .pr_disconnect = sockin_disconnect,
96 .pr_shutdown = sockin_shutdown,
97 .pr_abort = sockin_abort,
98 .pr_ioctl = sockin_ioctl,
99 .pr_stat = sockin_stat,
100 .pr_peeraddr = sockin_peeraddr,
101 .pr_sockaddr = sockin_sockaddr,
102 .pr_recvoob = sockin_recvoob,
103 .pr_sendoob = sockin_sendoob,
104 .pr_generic = sockin_usrreq,
105 };
106
107 const struct protosw sockinsw[] = {
108 {
109 .pr_type = SOCK_DGRAM,
110 .pr_domain = &sockindomain,
111 .pr_protocol = IPPROTO_UDP,
112 .pr_flags = PR_ATOMIC|PR_ADDR,
113 .pr_usrreqs = &sockin_usrreqs,
114 .pr_ctloutput = sockin_ctloutput,
115 },
116 {
117 .pr_type = SOCK_STREAM,
118 .pr_domain = &sockindomain,
119 .pr_protocol = IPPROTO_TCP,
120 .pr_flags = PR_CONNREQUIRED|PR_WANTRCVD|PR_LISTEN|PR_ABRTACPTDIS,
121 .pr_usrreqs = &sockin_usrreqs,
122 .pr_ctloutput = sockin_ctloutput,
123 }};
124 const struct protosw sockin6sw[] = {
125 {
126 .pr_type = SOCK_DGRAM,
127 .pr_domain = &sockin6domain,
128 .pr_protocol = IPPROTO_UDP,
129 .pr_flags = PR_ATOMIC|PR_ADDR,
130 .pr_usrreqs = &sockin_usrreqs,
131 .pr_ctloutput = sockin_ctloutput,
132 },
133 {
134 .pr_type = SOCK_STREAM,
135 .pr_domain = &sockin6domain,
136 .pr_protocol = IPPROTO_TCP,
137 .pr_flags = PR_CONNREQUIRED|PR_WANTRCVD|PR_LISTEN|PR_ABRTACPTDIS,
138 .pr_usrreqs = &sockin_usrreqs,
139 .pr_ctloutput = sockin_ctloutput,
140 }};
141
142 struct domain sockindomain = {
143 .dom_family = PF_INET,
144 .dom_name = "socket_inet",
145 .dom_init = sockin_init,
146 .dom_externalize = NULL,
147 .dom_dispose = NULL,
148 .dom_protosw = sockinsw,
149 .dom_protoswNPROTOSW = &sockinsw[__arraycount(sockinsw)],
150 .dom_rtattach = rt_inithead,
151 .dom_rtoffset = 32,
152 .dom_maxrtkey = sizeof(struct sockaddr_in),
153 .dom_ifattach = NULL,
154 .dom_ifdetach = NULL,
155 .dom_ifqueues = { NULL },
156 .dom_link = { NULL },
157 .dom_mowner = MOWNER_INIT("",""),
158 .dom_rtcache = { NULL },
159 .dom_sockaddr_cmp = NULL
160 };
161 struct domain sockin6domain = {
162 .dom_family = PF_INET6,
163 .dom_name = "socket_inet6",
164 .dom_init = sockin_init,
165 .dom_externalize = NULL,
166 .dom_dispose = NULL,
167 .dom_protosw = sockin6sw,
168 .dom_protoswNPROTOSW = &sockin6sw[__arraycount(sockin6sw)],
169 .dom_rtattach = rt_inithead,
170 .dom_rtoffset = 32,
171 .dom_maxrtkey = sizeof(struct sockaddr_in6),
172 .dom_ifattach = NULL,
173 .dom_ifdetach = NULL,
174 .dom_ifqueues = { NULL },
175 .dom_link = { NULL },
176 .dom_mowner = MOWNER_INIT("",""),
177 .dom_rtcache = { NULL },
178 .dom_sockaddr_cmp = NULL
179 };
180
/*
 * SO2S: read back the integer that registersock() stored in so_internal
 * (the host socket descriptor).  The argument is parenthesized so that
 * any pointer expression, e.g. "p + 1" or "&obj", expands correctly.
 */
#define SO2S(so) ((intptr_t)((so)->so_internal))

/* Buffer size used for soreserve() and the host SO_SNDBUF/SO_RCVBUF. */
#define SOCKIN_SBSIZE 65536
183
184 struct sockin_unit {
185 struct socket *su_so;
186
187 LIST_ENTRY(sockin_unit) su_entries;
188 };
189 static LIST_HEAD(, sockin_unit) su_ent = LIST_HEAD_INITIALIZER(su_ent);
190 static kmutex_t su_mtx;
191 static bool rebuild;
192 static int nsock;
193
194 /* XXX: for the bpf hack */
195 static struct ifnet sockin_if;
196 int ifpromisc(struct ifnet *ifp, int pswitch) { return 0; }
197
198 static int
199 registersock(struct socket *so, int news)
200 {
201 struct sockin_unit *su;
202
203 su = kmem_alloc(sizeof(*su), KM_NOSLEEP);
204 if (!su)
205 return ENOMEM;
206
207 so->so_internal = (void *)(intptr_t)news;
208 su->su_so = so;
209
210 mutex_enter(&su_mtx);
211 LIST_INSERT_HEAD(&su_ent, su, su_entries);
212 nsock++;
213 rebuild = true;
214 mutex_exit(&su_mtx);
215
216 return 0;
217 }
218
219 static void
220 removesock(struct socket *so)
221 {
222 struct sockin_unit *su_iter;
223
224 mutex_enter(&su_mtx);
225 LIST_FOREACH(su_iter, &su_ent, su_entries) {
226 if (su_iter->su_so == so)
227 break;
228 }
229 if (!su_iter)
230 panic("no such socket");
231
232 LIST_REMOVE(su_iter, su_entries);
233 nsock--;
234 rebuild = true;
235 mutex_exit(&su_mtx);
236
237 rumpuser_close(SO2S(su_iter->su_so));
238 kmem_free(su_iter, sizeof(*su_iter));
239 }
240
241 static void
242 sockin_process(struct socket *so)
243 {
244 struct sockaddr_in6 from;
245 struct iovec io;
246 struct msghdr rmsg;
247 struct mbuf *m;
248 size_t n, plen;
249 int error;
250
251 m = m_gethdr(M_WAIT, MT_DATA);
252 if (so->so_proto->pr_type == SOCK_DGRAM) {
253 plen = IP_MAXPACKET;
254 MEXTMALLOC(m, plen, M_DONTWAIT);
255 } else {
256 plen = MCLBYTES;
257 MCLGET(m, M_DONTWAIT);
258 }
259 if ((m->m_flags & M_EXT) == 0) {
260 m_freem(m);
261 return;
262 }
263
264 memset(&rmsg, 0, sizeof(rmsg));
265 io.iov_base = mtod(m, void *);
266 io.iov_len = plen;
267 rmsg.msg_iov = &io;
268 rmsg.msg_iovlen = 1;
269 rmsg.msg_name = (struct sockaddr *)&from;
270 rmsg.msg_namelen = sizeof(from);
271
272 error = rumpcomp_sockin_recvmsg(SO2S(so), &rmsg, 0, &n);
273 if (error || n == 0) {
274 m_freem(m);
275
276 /* Treat a TCP socket a goner */
277 if (error != EAGAIN && so->so_proto->pr_type == SOCK_STREAM) {
278 mutex_enter(softnet_lock);
279 soisdisconnected(so);
280 mutex_exit(softnet_lock);
281 removesock(so);
282 }
283 return;
284 }
285 m->m_len = m->m_pkthdr.len = n;
286
287 bpf_mtap_af(&sockin_if, AF_UNSPEC, m);
288
289 mutex_enter(softnet_lock);
290 if (so->so_proto->pr_type == SOCK_DGRAM) {
291 if (!sbappendaddr(&so->so_rcv, rmsg.msg_name, m, NULL)) {
292 m_freem(m);
293 }
294 } else {
295 sbappendstream(&so->so_rcv, m);
296 }
297
298 sorwakeup(so);
299 mutex_exit(softnet_lock);
300 }
301
302 static void
303 sockin_waccept(struct socket *so)
304 {
305 struct socket *nso;
306 struct sockaddr_in6 sin;
307 int news, error, slen;
308
309 slen = sizeof(sin);
310 error = rumpcomp_sockin_accept(SO2S(so), (struct sockaddr *)&sin,
311 &slen, &news);
312 if (error)
313 return;
314
315 mutex_enter(softnet_lock);
316 nso = sonewconn(so, true);
317 if (nso == NULL)
318 goto errout;
319 if (registersock(nso, news) != 0)
320 goto errout;
321 mutex_exit(softnet_lock);
322 return;
323
324 errout:
325 rumpuser_close(news);
326 if (nso)
327 soclose(nso);
328 mutex_exit(softnet_lock);
329 }
330
331 #define POLLTIMEOUT 100 /* check for new entries every 100ms */
332
333 /* XXX: doesn't handle socket (kernel) locking properly? */
334 static void
335 sockinworker(void *arg)
336 {
337 struct pollfd *pfds = NULL, *npfds;
338 struct sockin_unit *su_iter;
339 struct socket *so;
340 int cursock = 0, i, rv, error;
341
342 /*
343 * Loop reading requests. Check for new sockets periodically
344 * (could be smarter, but I'm lazy).
345 */
346 for (;;) {
347 if (rebuild) {
348 npfds = NULL;
349 mutex_enter(&su_mtx);
350 if (nsock)
351 npfds = kmem_alloc(nsock * sizeof(*npfds),
352 KM_NOSLEEP);
353 if (npfds || nsock == 0) {
354 if (pfds)
355 kmem_free(pfds, cursock*sizeof(*pfds));
356 pfds = npfds;
357 cursock = nsock;
358 rebuild = false;
359
360 i = 0;
361 LIST_FOREACH(su_iter, &su_ent, su_entries) {
362 pfds[i].fd = SO2S(su_iter->su_so);
363 pfds[i].events = POLLIN;
364 pfds[i].revents = 0;
365 i++;
366 }
367 KASSERT(i == nsock);
368 }
369 mutex_exit(&su_mtx);
370 }
371
372 /* find affected sockets & process */
373 error = rumpcomp_sockin_poll(pfds, cursock, POLLTIMEOUT, &rv);
374 for (i = 0; i < cursock && rv > 0 && error == 0; i++) {
375 if (pfds[i].revents & POLLIN) {
376 mutex_enter(&su_mtx);
377 LIST_FOREACH(su_iter, &su_ent, su_entries) {
378 if (SO2S(su_iter->su_so)==pfds[i].fd) {
379 so = su_iter->su_so;
380 mutex_exit(&su_mtx);
381 if(so->so_options&SO_ACCEPTCONN)
382 sockin_waccept(so);
383 else
384 sockin_process(so);
385 mutex_enter(&su_mtx);
386 break;
387 }
388 }
389 /* if we can't find it, just wing it */
390 KASSERT(rebuild || su_iter);
391 mutex_exit(&su_mtx);
392 pfds[i].revents = 0;
393 rv--;
394 i = -1;
395 continue;
396 }
397
398 /* something else? ignore */
399 if (pfds[i].revents) {
400 pfds[i].revents = 0;
401 rv--;
402 }
403 }
404 KASSERT(rv <= 0);
405 }
406
407 }
408
409 static int
410 sockin_do_init(void)
411 {
412 int rv;
413
414 if (rump_threads) {
415 if ((rv = kthread_create(PRI_NONE, 0, NULL, sockinworker,
416 NULL, NULL, "sockwork")) != 0)
417 panic("sockin_init: could not create worker thread\n");
418 } else {
419 printf("sockin_init: no threads => no worker thread\n");
420 }
421 mutex_init(&su_mtx, MUTEX_DEFAULT, IPL_NONE);
422 strlcpy(sockin_if.if_xname, "sockin0", sizeof(sockin_if.if_xname));
423 bpf_attach(&sockin_if, DLT_NULL, 0);
424 return 0;
425 }
426
427 static void
428 sockin_init(void)
429 {
430 static ONCE_DECL(init);
431
432 RUN_ONCE(&init, sockin_do_init);
433 }
434
435 static int
436 sockin_attach(struct socket *so, int proto)
437 {
438 const int type = so->so_proto->pr_type;
439 int error, news, family;
440
441 sosetlock(so);
442 if (so->so_snd.sb_hiwat == 0 || so->so_rcv.sb_hiwat == 0) {
443 error = soreserve(so, SOCKIN_SBSIZE, SOCKIN_SBSIZE);
444 if (error)
445 return error;
446 }
447
448 family = so->so_proto->pr_domain->dom_family;
449 KASSERT(family == PF_INET || family == PF_INET6);
450 error = rumpcomp_sockin_socket(family, type, 0, &news);
451 if (error)
452 return error;
453
454 /* For UDP sockets, make sure we can send/recv maximum. */
455 if (type == SOCK_DGRAM) {
456 int sbsize = SOCKIN_SBSIZE;
457 error = rumpcomp_sockin_setsockopt(news,
458 SOL_SOCKET, SO_SNDBUF,
459 &sbsize, sizeof(sbsize));
460 sbsize = SOCKIN_SBSIZE;
461 error = rumpcomp_sockin_setsockopt(news,
462 SOL_SOCKET, SO_RCVBUF,
463 &sbsize, sizeof(sbsize));
464 }
465
466 if ((error = registersock(so, news)) != 0)
467 rumpuser_close(news);
468
469 return error;
470 }
471
/* pr_detach: not implemented, panics when called. */
static void
sockin_detach(struct socket *so)
{

	panic("sockin_detach: IMPLEMENT ME\n");
}
477
/*
 * pr_accept: nothing left to do here, we do all the work in the worker
 * thread (see sockin_waccept()).  "nam" is left untouched.
 */
static int
sockin_accept(struct socket *so, struct mbuf *nam)
{

	KASSERT(solocked(so));
	return 0;
}
486
487 static int
488 sockin_bind(struct socket *so, struct mbuf *nam)
489 {
490 KASSERT(solocked(so));
491 KASSERT(nam != NULL);
492
493 return rumpcomp_sockin_bind(SO2S(so),
494 mtod(nam, const struct sockaddr *),
495 nam->m_len);
496 }
497
498 static int
499 sockin_listen(struct socket *so)
500 {
501 KASSERT(solocked(so));
502
503 return rumpcomp_sockin_listen(SO2S(so), so->so_qlimit);
504 }
505
506 static int
507 sockin_connect(struct socket *so, struct mbuf *nam)
508 {
509 int error = 0;
510
511 KASSERT(solocked(so));
512 KASSERT(nam != NULL);
513
514 error = rumpcomp_sockin_connect(SO2S(so),
515 mtod(nam, struct sockaddr *), nam->m_len);
516 if (error == 0)
517 soisconnected(so);
518
519 return error;
520 }
521
/* pr_disconnect: not implemented, panics when called. */
static int
sockin_disconnect(struct socket *so)
{

	KASSERT(solocked(so));
	panic("sockin_disconnect: IMPLEMENT ME, disconnect not supported");
}
529
/*
 * pr_shutdown: unregister the socket, which (in removesock()) also
 * closes the host descriptor.  Always returns 0.
 */
static int
sockin_shutdown(struct socket *so)
{

	KASSERT(solocked(so));
	removesock(so);

	return 0;
}
538
/* pr_abort: not implemented, panics when called. */
static int
sockin_abort(struct socket *so)
{

	KASSERT(solocked(so));
	panic("sockin_abort: IMPLEMENT ME, abort not supported");
}
546
547 static int
548 sockin_ioctl(struct socket *so, u_long cmd, void *nam, struct ifnet *ifp)
549 {
550 return ENOTTY;
551 }
552
/* pr_stat: reports success and leaves "ub" exactly as it was passed in. */
static int
sockin_stat(struct socket *so, struct stat *ub)
{

	KASSERT(solocked(so));
	return 0;
}
560
561 static int
562 sockin_peeraddr(struct socket *so, struct mbuf *nam)
563 {
564 KASSERT(solocked(so));
565
566 int error = 0;
567 int slen = nam->m_len;
568
569 error = rumpcomp_sockin_getname(SO2S(so),
570 mtod(nam, struct sockaddr *), &slen, RUMPCOMP_SOCKIN_PEERNAME);
571 if (error == 0)
572 nam->m_len = slen;
573 return error;
574 }
575
576 static int
577 sockin_sockaddr(struct socket *so, struct mbuf *nam)
578 {
579 KASSERT(solocked(so));
580
581 int error = 0;
582 int slen = nam->m_len;
583
584 error = rumpcomp_sockin_getname(SO2S(so),
585 mtod(nam, struct sockaddr *), &slen, RUMPCOMP_SOCKIN_SOCKNAME);
586 if (error == 0)
587 nam->m_len = slen;
588 return error;
589 }
590
/* pr_recvoob: out-of-band receive is not implemented, panics when called. */
static int
sockin_recvoob(struct socket *so, struct mbuf *m, int flags)
{

	KASSERT(solocked(so));
	panic("sockin_recvoob: IMPLEMENT ME, recvoob not supported");
}
598
/* pr_sendoob: out-of-band send is not implemented, panics when called. */
static int
sockin_sendoob(struct socket *so, struct mbuf *m, struct mbuf *control)
{

	KASSERT(solocked(so));
	panic("sockin_sendoob: IMPLEMENT ME, sendoob not supported");
}
606
607 static int
608 sockin_usrreq(struct socket *so, int req, struct mbuf *m, struct mbuf *nam,
609 struct mbuf *control, struct lwp *l)
610 {
611 int error = 0;
612
613 KASSERT(req != PRU_ACCEPT);
614 KASSERT(req != PRU_BIND);
615 KASSERT(req != PRU_LISTEN);
616 KASSERT(req != PRU_CONNECT);
617 KASSERT(req != PRU_DISCONNECT);
618 KASSERT(req != PRU_SHUTDOWN);
619 KASSERT(req != PRU_ABORT);
620 KASSERT(req != PRU_CONTROL);
621 KASSERT(req != PRU_SENSE);
622 KASSERT(req != PRU_PEERADDR);
623 KASSERT(req != PRU_SOCKADDR);
624 KASSERT(req != PRU_RCVOOB);
625 KASSERT(req != PRU_SENDOOB);
626
627 switch (req) {
628 case PRU_SEND:
629 {
630 struct sockaddr *saddr;
631 struct msghdr mhdr;
632 size_t iov_max, i;
633 struct iovec iov_buf[32], *iov;
634 struct mbuf *m2;
635 size_t tot, n;
636 int s;
637
638 bpf_mtap_af(&sockin_if, AF_UNSPEC, m);
639
640 memset(&mhdr, 0, sizeof(mhdr));
641
642 iov_max = 0;
643 for (m2 = m; m2 != NULL; m2 = m2->m_next) {
644 iov_max++;
645 }
646
647 if (iov_max <= __arraycount(iov_buf)) {
648 iov = iov_buf;
649 } else {
650 iov = kmem_alloc(sizeof(struct iovec) * iov_max,
651 KM_SLEEP);
652 }
653
654 tot = 0;
655 for (i = 0, m2 = m; m2 != NULL; m2 = m2->m_next, i++) {
656 iov[i].iov_base = m2->m_data;
657 iov[i].iov_len = m2->m_len;
658 tot += m2->m_len;
659 }
660 mhdr.msg_iov = iov;
661 mhdr.msg_iovlen = i;
662 s = SO2S(so);
663
664 if (nam != NULL) {
665 saddr = mtod(nam, struct sockaddr *);
666 mhdr.msg_name = saddr;
667 mhdr.msg_namelen = saddr->sa_len;
668 }
669
670 rumpcomp_sockin_sendmsg(s, &mhdr, 0, &n);
671
672 if (iov != iov_buf)
673 kmem_free(iov, sizeof(struct iovec) * iov_max);
674
675 m_freem(m);
676 m_freem(control);
677
678 /* this assumes too many things to list.. buthey, testing */
679 if (!rump_threads)
680 sockin_process(so);
681 }
682 break;
683
684 default:
685 panic("sockin_usrreq: IMPLEMENT ME, req %d not supported", req);
686 }
687
688 return error;
689 }
690
691 static int
692 sockin_ctloutput(int op, struct socket *so, struct sockopt *sopt)
693 {
694
695 return rumpcomp_sockin_setsockopt(SO2S(so), sopt->sopt_level,
696 sopt->sopt_name, sopt->sopt_data, sopt->sopt_size);
697 }
698
/*
 * Catch-all for kernel interfaces that are not provided here:
 * rtrequest, ifunit and ifreq_setaddr are all aliased to this function,
 * so a call to any of them panics.
 */
int	sockin_unavailable(void);

int
sockin_unavailable(void)
{

	panic("interface not available in with sockin");
}

__strong_alias(rtrequest,sockin_unavailable);
__strong_alias(ifunit,sockin_unavailable);
__strong_alias(ifreq_setaddr,sockin_unavailable);
709