hijack.c revision 1.8 1 1.8 pooka /* $NetBSD: hijack.c,v 1.8 2011/01/17 16:27:54 pooka Exp $ */
2 1.1 pooka
3 1.1 pooka /*-
4 1.1 pooka * Copyright (c) 2011 Antti Kantee. All Rights Reserved.
5 1.1 pooka *
6 1.1 pooka * Redistribution and use in source and binary forms, with or without
7 1.1 pooka * modification, are permitted provided that the following conditions
8 1.1 pooka * are met:
9 1.1 pooka * 1. Redistributions of source code must retain the above copyright
10 1.1 pooka * notice, this list of conditions and the following disclaimer.
11 1.1 pooka * 2. Redistributions in binary form must reproduce the above copyright
12 1.1 pooka * notice, this list of conditions and the following disclaimer in the
13 1.1 pooka * documentation and/or other materials provided with the distribution.
14 1.1 pooka *
15 1.1 pooka * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS
16 1.1 pooka * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
17 1.1 pooka * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
18 1.1 pooka * DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
19 1.1 pooka * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
20 1.1 pooka * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
21 1.1 pooka * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
22 1.1 pooka * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
23 1.1 pooka * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
24 1.1 pooka * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
25 1.1 pooka * SUCH DAMAGE.
26 1.1 pooka */
27 1.1 pooka
28 1.1 pooka #include <sys/cdefs.h>
29 1.8 pooka __RCSID("$NetBSD: hijack.c,v 1.8 2011/01/17 16:27:54 pooka Exp $");
30 1.1 pooka
31 1.1 pooka #include <sys/param.h>
32 1.1 pooka #include <sys/types.h>
33 1.1 pooka #include <sys/ioctl.h>
34 1.1 pooka #include <sys/socket.h>
35 1.1 pooka #include <sys/poll.h>
36 1.1 pooka
37 1.1 pooka #include <rump/rumpclient.h>
38 1.1 pooka #include <rump/rump_syscalls.h>
39 1.1 pooka
40 1.1 pooka #include <assert.h>
41 1.1 pooka #include <dlfcn.h>
42 1.1 pooka #include <err.h>
43 1.1 pooka #include <errno.h>
44 1.1 pooka #include <fcntl.h>
45 1.1 pooka #include <poll.h>
46 1.1 pooka #include <pthread.h>
47 1.3 pooka #include <signal.h>
48 1.1 pooka #include <stdarg.h>
49 1.8 pooka #include <stdbool.h>
50 1.1 pooka #include <stdio.h>
51 1.1 pooka #include <stdlib.h>
52 1.3 pooka #include <time.h>
53 1.1 pooka #include <unistd.h>
54 1.1 pooka
/*
 * Indices into rumpcalls[] and sysnames[], one per rump kernel system
 * call the wrappers dispatch to.  rcinit() resolves sysnames[i] into
 * rumpcalls[i], so the order here must match sysnames[].
 */
enum {
	RUMPCALL_SOCKET,
	RUMPCALL_ACCEPT,
	RUMPCALL_BIND,
	RUMPCALL_CONNECT,
	RUMPCALL_GETPEERNAME,
	RUMPCALL_GETSOCKNAME,
	RUMPCALL_LISTEN,
	RUMPCALL_RECVFROM,
	RUMPCALL_RECVMSG,
	RUMPCALL_SENDTO,
	RUMPCALL_SENDMSG,
	RUMPCALL_GETSOCKOPT,
	RUMPCALL_SETSOCKOPT,
	RUMPCALL_SHUTDOWN,
	RUMPCALL_READ,
	RUMPCALL_READV,
	RUMPCALL_WRITE,
	RUMPCALL_WRITEV,
	RUMPCALL_IOCTL,
	RUMPCALL_FCNTL,
	RUMPCALL_CLOSE,
	RUMPCALL_POLLTS,
	RUMPCALL__NUM		/* number of entries; not a call */
};
68 1.1 pooka
69 1.8 pooka #define RSYS_STRING(a) __STRING(a)
70 1.8 pooka #define RSYS_NAME(a) RSYS_STRING(__CONCAT(RUMP_SYS_RENAME_,a))
71 1.8 pooka
72 1.1 pooka const char *sysnames[] = {
73 1.8 pooka RSYS_NAME(SOCKET),
74 1.8 pooka RSYS_NAME(ACCEPT),
75 1.8 pooka RSYS_NAME(BIND),
76 1.8 pooka RSYS_NAME(CONNECT),
77 1.8 pooka RSYS_NAME(GETPEERNAME),
78 1.8 pooka RSYS_NAME(GETSOCKNAME),
79 1.8 pooka RSYS_NAME(LISTEN),
80 1.8 pooka RSYS_NAME(RECVFROM),
81 1.8 pooka RSYS_NAME(RECVMSG),
82 1.8 pooka RSYS_NAME(SENDTO),
83 1.8 pooka RSYS_NAME(SENDMSG),
84 1.8 pooka RSYS_NAME(GETSOCKOPT),
85 1.8 pooka RSYS_NAME(SETSOCKOPT),
86 1.8 pooka RSYS_NAME(SHUTDOWN),
87 1.8 pooka RSYS_NAME(READ),
88 1.8 pooka RSYS_NAME(READV),
89 1.8 pooka RSYS_NAME(WRITE),
90 1.8 pooka RSYS_NAME(WRITEV),
91 1.8 pooka RSYS_NAME(IOCTL),
92 1.8 pooka RSYS_NAME(FCNTL),
93 1.8 pooka RSYS_NAME(CLOSE),
94 1.8 pooka RSYS_NAME(POLLTS),
95 1.1 pooka };
96 1.1 pooka
97 1.7 pooka static int (*host_socket)(int, int, int);
98 1.7 pooka static int (*host_connect)(int, const struct sockaddr *, socklen_t);
99 1.7 pooka static int (*host_bind)(int, const struct sockaddr *, socklen_t);
100 1.7 pooka static int (*host_listen)(int, int);
101 1.7 pooka static int (*host_accept)(int, struct sockaddr *, socklen_t *);
102 1.7 pooka static int (*host_getpeername)(int, struct sockaddr *, socklen_t *);
103 1.7 pooka static int (*host_getsockname)(int, struct sockaddr *, socklen_t *);
104 1.7 pooka static int (*host_setsockopt)(int, int, int, const void *, socklen_t);
105 1.7 pooka
106 1.1 pooka static ssize_t (*host_read)(int, void *, size_t);
107 1.1 pooka static ssize_t (*host_readv)(int, const struct iovec *, int);
108 1.1 pooka static ssize_t (*host_write)(int, const void *, size_t);
109 1.1 pooka static ssize_t (*host_writev)(int, const struct iovec *, int);
110 1.1 pooka static int (*host_ioctl)(int, unsigned long, ...);
111 1.1 pooka static int (*host_fcntl)(int, int, ...);
112 1.1 pooka static int (*host_close)(int);
113 1.3 pooka static int (*host_pollts)(struct pollfd *, nfds_t,
114 1.3 pooka const struct timespec *, const sigset_t *);
115 1.2 pooka static pid_t (*host_fork)(void);
116 1.2 pooka static int (*host_dup2)(int, int);
117 1.1 pooka
118 1.1 pooka static void *rumpcalls[RUMPCALL__NUM];
119 1.1 pooka
/*
 * dlsym() trampoline.  rcinit() stores this function's address in
 * librumpclient's rumpclient_dlsym so that, in the LD_PRELOAD case,
 * lookups are made from this library and RTLD_NEXT resolves correctly.
 */
static void *
hijackdlsym(void *handle, const char *symbol)
{
	void *sym;

	sym = dlsym(handle, symbol);
	return sym;
}
130 1.1 pooka
/*
 * low calorie sockets?  When set, __socket30() creates AF_LOCAL sockets
 * with the host's socket call instead of the rump kernel's.  Static
 * storage, so it starts out false.
 */
static bool hostlocalsockets;
133 1.7 pooka
134 1.1 pooka static void __attribute__((constructor))
135 1.1 pooka rcinit(void)
136 1.1 pooka {
137 1.1 pooka int (*rumpcinit)(void);
138 1.1 pooka void **rumpcdlsym;
139 1.1 pooka void *hand;
140 1.1 pooka int i;
141 1.1 pooka
142 1.1 pooka hand = dlopen("librumpclient.so", RTLD_LAZY|RTLD_GLOBAL);
143 1.1 pooka if (!hand)
144 1.1 pooka err(1, "cannot open librumpclient.so");
145 1.1 pooka rumpcinit = dlsym(hand, "rumpclient_init");
146 1.1 pooka _DIAGASSERT(rumpcinit);
147 1.1 pooka
148 1.1 pooka rumpcdlsym = dlsym(hand, "rumpclient_dlsym");
149 1.1 pooka *rumpcdlsym = hijackdlsym;
150 1.1 pooka
151 1.7 pooka host_socket = dlsym(RTLD_NEXT, "__socket30");
152 1.7 pooka host_listen = dlsym(RTLD_NEXT, "listen");
153 1.7 pooka host_connect = dlsym(RTLD_NEXT, "connect");
154 1.7 pooka host_bind = dlsym(RTLD_NEXT, "bind");
155 1.7 pooka host_accept = dlsym(RTLD_NEXT, "accept");
156 1.7 pooka host_getpeername = dlsym(RTLD_NEXT, "getpeername");
157 1.7 pooka host_getsockname = dlsym(RTLD_NEXT, "getsockname");
158 1.7 pooka host_setsockopt = dlsym(RTLD_NEXT, "setsockopt");
159 1.7 pooka
160 1.1 pooka host_read = dlsym(RTLD_NEXT, "read");
161 1.1 pooka host_readv = dlsym(RTLD_NEXT, "readv");
162 1.1 pooka host_write = dlsym(RTLD_NEXT, "write");
163 1.1 pooka host_writev = dlsym(RTLD_NEXT, "writev");
164 1.1 pooka host_ioctl = dlsym(RTLD_NEXT, "ioctl");
165 1.1 pooka host_fcntl = dlsym(RTLD_NEXT, "fcntl");
166 1.1 pooka host_close = dlsym(RTLD_NEXT, "close");
167 1.3 pooka host_pollts = dlsym(RTLD_NEXT, "pollts");
168 1.2 pooka host_fork = dlsym(RTLD_NEXT, "fork");
169 1.2 pooka host_dup2 = dlsym(RTLD_NEXT, "dup2");
170 1.1 pooka
171 1.1 pooka for (i = 0; i < RUMPCALL__NUM; i++) {
172 1.8 pooka rumpcalls[i] = dlsym(hand, sysnames[i]);
173 1.1 pooka if (!rumpcalls[i]) {
174 1.8 pooka fprintf(stderr, "rumphijack: cannot find symbol: %s\n",
175 1.8 pooka sysnames[i]);
176 1.1 pooka exit(1);
177 1.1 pooka }
178 1.1 pooka }
179 1.1 pooka
180 1.1 pooka if (rumpcinit() == -1)
181 1.1 pooka err(1, "rumpclient init");
182 1.1 pooka }
183 1.1 pooka
/*
 * Records which of the low descriptors have been dup2'd onto a rump
 * kernel descriptor: dup2() ORs (newd + 1) into the mask and
 * ISDUP2D(fd) tests whether all bits of (fd + 1) are present.
 *
 * NOTE(review): with this encoding fd 2 is stored as 3 == (1|2), which
 * also makes ISDUP2D(0) and ISDUP2D(1) true, and ISDUP2D(-1) is always
 * true because (0 & mask) == 0.  Changing the encoding requires
 * changing dup2() at the same time.
 */
static unsigned dup2mask;
#define ISDUP2D(fd) ((((fd)+1) & dup2mask) == ((fd)+1))
186 1.5 pooka
/*
 * Debug tracing.  With DEBUGJACK defined, DPRINTF((fmt, ...)) prints to
 * stderr through mydprintf(); otherwise it expands to nothing.
 */
/* #define DEBUGJACK */
#ifndef DEBUGJACK
#define DPRINTF(x)
#else
#define DPRINTF(x) mydprintf x
static void
mydprintf(const char *fmt, ...)
{
	va_list ap;

	/* print only while stderr has not been dup2'd to a rump fd */
	if (!ISDUP2D(STDERR_FILENO)) {
		va_start(ap, fmt);
		vfprintf(stderr, fmt, ap);
		va_end(ap);
	}
}

#endif
206 1.1 pooka
/*
 * Offset added to rump kernel descriptors when they are handed to the
 * application, so that they can be told apart from host descriptors.
 *
 * XXX: need runtime selection.  low for now due to FD_SETSIZE
 *
 * HIJACK_ASSERT repeats the number instead of referring to HIJACK_FDOFF
 * because HIJACK_FDOFF is #undef'd after the helpers below, while
 * assertfd() is expanded later in the file.
 */
#define HIJACK_FDOFF 128
#define HIJACK_SELECT 128 /* XXX */
#define HIJACK_ASSERT 128 /* XXX */
211 1.2 pooka static int
212 1.2 pooka fd_rump2host(int fd)
213 1.2 pooka {
214 1.2 pooka
215 1.2 pooka if (fd == -1)
216 1.2 pooka return fd;
217 1.2 pooka
218 1.2 pooka if (!ISDUP2D(fd))
219 1.2 pooka fd += HIJACK_FDOFF;
220 1.2 pooka
221 1.2 pooka return fd;
222 1.2 pooka }
223 1.2 pooka
224 1.2 pooka static int
225 1.2 pooka fd_host2rump(int fd)
226 1.2 pooka {
227 1.2 pooka
228 1.2 pooka if (!ISDUP2D(fd))
229 1.2 pooka fd -= HIJACK_FDOFF;
230 1.2 pooka return fd;
231 1.2 pooka }
232 1.2 pooka
233 1.2 pooka static bool
234 1.2 pooka fd_isrump(int fd)
235 1.2 pooka {
236 1.2 pooka
237 1.2 pooka return ISDUP2D(fd) || fd >= HIJACK_FDOFF;
238 1.2 pooka }
239 1.2 pooka
/* assert that _fd_ is a rump kernel descriptor (dup2'd or >= HIJACK_ASSERT) */
#define assertfd(_fd_) assert((_fd_) >= HIJACK_ASSERT || ISDUP2D(_fd_))
/* the raw offset is private to the fd_* helpers above */
#undef HIJACK_FDOFF
242 1.2 pooka
/*
 * Socket call wrappers.  Calls that have a host counterpart resolved in
 * rcinit() pick the host or the rump kernel based on the descriptor;
 * the remaining ones always call the rump kernel.
 */
246 1.1 pooka
247 1.1 pooka int __socket30(int, int, int);
248 1.1 pooka int
249 1.1 pooka __socket30(int domain, int type, int protocol)
250 1.1 pooka {
251 1.1 pooka int (*rc_socket)(int, int, int);
252 1.1 pooka int fd;
253 1.7 pooka bool dohost;
254 1.7 pooka
255 1.7 pooka dohost = hostlocalsockets && (domain == AF_LOCAL);
256 1.1 pooka
257 1.7 pooka if (dohost)
258 1.7 pooka rc_socket = host_socket;
259 1.7 pooka else
260 1.7 pooka rc_socket = rumpcalls[RUMPCALL_SOCKET];
261 1.1 pooka fd = rc_socket(domain, type, protocol);
262 1.2 pooka
263 1.7 pooka if (!dohost)
264 1.7 pooka fd = fd_rump2host(fd);
265 1.7 pooka DPRINTF(("socket <- %d\n", fd));
266 1.2 pooka
267 1.7 pooka return fd;
268 1.1 pooka }
269 1.1 pooka
270 1.1 pooka int
271 1.1 pooka accept(int s, struct sockaddr *addr, socklen_t *addrlen)
272 1.1 pooka {
273 1.1 pooka int (*rc_accept)(int, struct sockaddr *, socklen_t *);
274 1.1 pooka int fd;
275 1.7 pooka bool isrump;
276 1.7 pooka
277 1.7 pooka isrump = fd_isrump(s);
278 1.1 pooka
279 1.2 pooka DPRINTF(("accept -> %d", s));
280 1.7 pooka if (isrump) {
281 1.7 pooka rc_accept = rumpcalls[RUMPCALL_ACCEPT];
282 1.7 pooka s = fd_host2rump(s);
283 1.7 pooka } else {
284 1.7 pooka rc_accept = host_accept;
285 1.7 pooka }
286 1.7 pooka fd = rc_accept(s, addr, addrlen);
287 1.7 pooka if (fd != -1 && isrump)
288 1.7 pooka fd = fd_rump2host(fd);
289 1.7 pooka
290 1.7 pooka DPRINTF((" <- %d\n", fd));
291 1.2 pooka
292 1.7 pooka return fd;
293 1.1 pooka }
294 1.1 pooka
295 1.1 pooka int
296 1.1 pooka bind(int s, const struct sockaddr *name, socklen_t namelen)
297 1.1 pooka {
298 1.1 pooka int (*rc_bind)(int, const struct sockaddr *, socklen_t);
299 1.1 pooka
300 1.2 pooka DPRINTF(("bind -> %d\n", s));
301 1.7 pooka if (fd_isrump(s)) {
302 1.7 pooka rc_bind = rumpcalls[RUMPCALL_BIND];
303 1.7 pooka s = fd_host2rump(s);
304 1.7 pooka } else {
305 1.7 pooka rc_bind = host_bind;
306 1.7 pooka }
307 1.7 pooka return rc_bind(s, name, namelen);
308 1.1 pooka }
309 1.1 pooka
310 1.1 pooka int
311 1.1 pooka connect(int s, const struct sockaddr *name, socklen_t namelen)
312 1.1 pooka {
313 1.1 pooka int (*rc_connect)(int, const struct sockaddr *, socklen_t);
314 1.1 pooka
315 1.2 pooka DPRINTF(("connect -> %d\n", s));
316 1.7 pooka if (fd_isrump(s)) {
317 1.7 pooka rc_connect = rumpcalls[RUMPCALL_CONNECT];
318 1.7 pooka s = fd_host2rump(s);
319 1.7 pooka } else {
320 1.7 pooka rc_connect = host_connect;
321 1.7 pooka }
322 1.2 pooka
323 1.7 pooka return rc_connect(s, name, namelen);
324 1.1 pooka }
325 1.1 pooka
326 1.1 pooka int
327 1.1 pooka getpeername(int s, struct sockaddr *name, socklen_t *namelen)
328 1.1 pooka {
329 1.1 pooka int (*rc_getpeername)(int, struct sockaddr *, socklen_t *);
330 1.1 pooka
331 1.2 pooka DPRINTF(("getpeername -> %d\n", s));
332 1.7 pooka if (fd_isrump(s)) {
333 1.7 pooka rc_getpeername = rumpcalls[RUMPCALL_GETPEERNAME];
334 1.7 pooka s = fd_host2rump(s);
335 1.7 pooka } else {
336 1.7 pooka rc_getpeername = host_getpeername;
337 1.7 pooka }
338 1.7 pooka return rc_getpeername(s, name, namelen);
339 1.1 pooka }
340 1.1 pooka
341 1.1 pooka int
342 1.1 pooka getsockname(int s, struct sockaddr *name, socklen_t *namelen)
343 1.1 pooka {
344 1.1 pooka int (*rc_getsockname)(int, struct sockaddr *, socklen_t *);
345 1.1 pooka
346 1.2 pooka DPRINTF(("getsockname -> %d\n", s));
347 1.7 pooka if (fd_isrump(s)) {
348 1.7 pooka rc_getsockname = rumpcalls[RUMPCALL_GETSOCKNAME];
349 1.7 pooka s = fd_host2rump(s);
350 1.7 pooka } else {
351 1.7 pooka rc_getsockname = host_getsockname;
352 1.7 pooka }
353 1.7 pooka return rc_getsockname(s, name, namelen);
354 1.1 pooka }
355 1.1 pooka
356 1.1 pooka int
357 1.1 pooka listen(int s, int backlog)
358 1.1 pooka {
359 1.1 pooka int (*rc_listen)(int, int);
360 1.1 pooka
361 1.2 pooka DPRINTF(("listen -> %d\n", s));
362 1.7 pooka if (fd_isrump(s)) {
363 1.7 pooka rc_listen = rumpcalls[RUMPCALL_LISTEN];
364 1.7 pooka s = fd_host2rump(s);
365 1.7 pooka } else {
366 1.7 pooka rc_listen = host_listen;
367 1.7 pooka }
368 1.7 pooka return rc_listen(s, backlog);
369 1.1 pooka }
370 1.1 pooka
/* recv(2) expressed as recvfrom() without a source address. */
ssize_t
recv(int s, void *buf, size_t len, int flags)
{
	ssize_t nrecv;

	nrecv = recvfrom(s, buf, len, flags, NULL, NULL);
	return nrecv;
}
377 1.1 pooka
378 1.1 pooka ssize_t
379 1.1 pooka recvfrom(int s, void *buf, size_t len, int flags, struct sockaddr *from,
380 1.1 pooka socklen_t *fromlen)
381 1.1 pooka {
382 1.1 pooka int (*rc_recvfrom)(int, void *, size_t, int,
383 1.1 pooka struct sockaddr *, socklen_t *);
384 1.1 pooka
385 1.1 pooka DPRINTF(("recvfrom\n"));
386 1.1 pooka assertfd(s);
387 1.1 pooka rc_recvfrom = rumpcalls[RUMPCALL_RECVFROM];
388 1.2 pooka return rc_recvfrom(fd_host2rump(s), buf, len, flags, from, fromlen);
389 1.1 pooka }
390 1.1 pooka
391 1.1 pooka ssize_t
392 1.1 pooka recvmsg(int s, struct msghdr *msg, int flags)
393 1.1 pooka {
394 1.1 pooka int (*rc_recvmsg)(int, struct msghdr *, int);
395 1.1 pooka
396 1.1 pooka DPRINTF(("recvmsg\n"));
397 1.1 pooka assertfd(s);
398 1.1 pooka rc_recvmsg = rumpcalls[RUMPCALL_RECVMSG];
399 1.2 pooka return rc_recvmsg(fd_host2rump(s), msg, flags);
400 1.1 pooka }
401 1.1 pooka
/* send(2) expressed as sendto() without a destination address. */
ssize_t
send(int s, const void *buf, size_t len, int flags)
{
	ssize_t nsent;

	nsent = sendto(s, buf, len, flags, NULL, 0);
	return nsent;
}
408 1.1 pooka
409 1.1 pooka ssize_t
410 1.1 pooka sendto(int s, const void *buf, size_t len, int flags,
411 1.1 pooka const struct sockaddr *to, socklen_t tolen)
412 1.1 pooka {
413 1.1 pooka int (*rc_sendto)(int, const void *, size_t, int,
414 1.1 pooka const struct sockaddr *, socklen_t);
415 1.1 pooka
416 1.1 pooka if (s == -1)
417 1.1 pooka return len;
418 1.1 pooka
419 1.1 pooka DPRINTF(("sendto\n"));
420 1.1 pooka assertfd(s);
421 1.1 pooka rc_sendto = rumpcalls[RUMPCALL_SENDTO];
422 1.2 pooka return rc_sendto(fd_host2rump(s), buf, len, flags, to, tolen);
423 1.1 pooka }
424 1.1 pooka
425 1.1 pooka ssize_t
426 1.1 pooka sendmsg(int s, const struct msghdr *msg, int flags)
427 1.1 pooka {
428 1.1 pooka int (*rc_sendmsg)(int, const struct msghdr *, int);
429 1.1 pooka
430 1.1 pooka DPRINTF(("sendmsg\n"));
431 1.1 pooka assertfd(s);
432 1.1 pooka rc_sendmsg = rumpcalls[RUMPCALL_SENDTO];
433 1.2 pooka return rc_sendmsg(fd_host2rump(s), msg, flags);
434 1.1 pooka }
435 1.1 pooka
436 1.1 pooka int
437 1.1 pooka getsockopt(int s, int level, int optname, void *optval, socklen_t *optlen)
438 1.1 pooka {
439 1.1 pooka int (*rc_getsockopt)(int, int, int, void *, socklen_t *);
440 1.1 pooka
441 1.7 pooka DPRINTF(("getsockopt -> %d\n", s));
442 1.1 pooka assertfd(s);
443 1.1 pooka rc_getsockopt = rumpcalls[RUMPCALL_GETSOCKOPT];
444 1.2 pooka return rc_getsockopt(fd_host2rump(s), level, optname, optval, optlen);
445 1.1 pooka }
446 1.1 pooka
447 1.1 pooka int
448 1.1 pooka setsockopt(int s, int level, int optname, const void *optval, socklen_t optlen)
449 1.1 pooka {
450 1.1 pooka int (*rc_setsockopt)(int, int, int, const void *, socklen_t);
451 1.1 pooka
452 1.7 pooka DPRINTF(("setsockopt -> %d\n", s));
453 1.7 pooka if (fd_isrump(s)) {
454 1.7 pooka rc_setsockopt = rumpcalls[RUMPCALL_SETSOCKOPT];
455 1.7 pooka s = fd_host2rump(s);
456 1.7 pooka } else {
457 1.7 pooka rc_setsockopt = host_setsockopt;
458 1.7 pooka }
459 1.7 pooka return rc_setsockopt(s, level, optname, optval, optlen);
460 1.1 pooka }
461 1.1 pooka
462 1.1 pooka int
463 1.1 pooka shutdown(int s, int how)
464 1.1 pooka {
465 1.1 pooka int (*rc_shutdown)(int, int);
466 1.1 pooka
467 1.7 pooka DPRINTF(("shutdown -> %d\n", s));
468 1.1 pooka assertfd(s);
469 1.1 pooka rc_shutdown = rumpcalls[RUMPCALL_SHUTDOWN];
470 1.2 pooka return rc_shutdown(fd_host2rump(s), how);
471 1.2 pooka }
472 1.2 pooka
473 1.2 pooka /*
474 1.2 pooka * dup2 is special. we allow dup2 of a rump kernel fd to 0-2 since
475 1.2 pooka * many programs do that. dup2 of a rump kernel fd to another value
476 1.2 pooka * not >= fdoff is an error.
477 1.2 pooka *
478 1.2 pooka * Note: cannot rump2host newd, because it is often hardcoded.
479 1.2 pooka *
480 1.2 pooka * XXX: should disable debug prints after stdout/stderr are dup2'd
481 1.2 pooka */
482 1.2 pooka int
483 1.2 pooka dup2(int oldd, int newd)
484 1.2 pooka {
485 1.2 pooka int rv;
486 1.2 pooka
487 1.2 pooka DPRINTF(("dup2 -> %d (o) -> %d (n)\n", oldd, newd));
488 1.2 pooka
489 1.2 pooka if (fd_isrump(oldd)) {
490 1.2 pooka if (!(newd >= 0 && newd <= 2))
491 1.2 pooka return EBADF;
492 1.2 pooka oldd = fd_host2rump(oldd);
493 1.2 pooka rv = rump_sys_dup2(oldd, newd);
494 1.2 pooka if (rv != -1)
495 1.2 pooka dup2mask |= newd+1;
496 1.2 pooka return rv;
497 1.2 pooka } else {
498 1.2 pooka return host_dup2(oldd, newd);
499 1.2 pooka }
500 1.2 pooka }
501 1.2 pooka
/*
 * fork(2) wrapper.  The host fork is bracketed by the rump client
 * prefork / fork_init calls so that the child keeps the parent's file
 * descriptors without both processes using the same connection fd.
 */

pid_t
fork()
{
	struct rumpclient_fork *rf;
	pid_t pid;

	DPRINTF(("fork\n"));

	rf = rumpclient_prefork();
	if (rf == NULL)
		return -1;

	pid = host_fork();
	if (pid == 0) {
		/* child: finish rump client setup; failure fails the fork */
		if (rumpclient_fork_init(rf) == -1)
			pid = -1;
	}
	/* XXX: cancel rf if host_fork() returned -1 */

	DPRINTF(("fork returns %d\n", pid));
	return pid;
}
534 1.1 pooka
535 1.1 pooka /*
536 1.1 pooka * Hybrids
537 1.1 pooka */
538 1.1 pooka
539 1.1 pooka ssize_t
540 1.1 pooka read(int fd, void *buf, size_t len)
541 1.1 pooka {
542 1.1 pooka int (*op_read)(int, void *, size_t);
543 1.1 pooka ssize_t n;
544 1.1 pooka
545 1.1 pooka DPRINTF(("read %d\n", fd));
546 1.2 pooka if (fd_isrump(fd)) {
547 1.2 pooka fd = fd_host2rump(fd);
548 1.2 pooka op_read = rumpcalls[RUMPCALL_READ];
549 1.2 pooka } else {
550 1.1 pooka op_read = host_read;
551 1.1 pooka }
552 1.1 pooka
553 1.1 pooka n = op_read(fd, buf, len);
554 1.1 pooka return n;
555 1.1 pooka }
556 1.1 pooka
557 1.1 pooka ssize_t
558 1.1 pooka readv(int fd, const struct iovec *iov, int iovcnt)
559 1.1 pooka {
560 1.1 pooka int (*op_readv)(int, const struct iovec *, int);
561 1.1 pooka
562 1.7 pooka DPRINTF(("readv %d\n", fd));
563 1.2 pooka if (fd_isrump(fd)) {
564 1.2 pooka fd = fd_host2rump(fd);
565 1.2 pooka op_readv = rumpcalls[RUMPCALL_READV];
566 1.2 pooka } else {
567 1.1 pooka op_readv = host_readv;
568 1.1 pooka }
569 1.1 pooka
570 1.1 pooka return op_readv(fd, iov, iovcnt);
571 1.1 pooka }
572 1.1 pooka
573 1.1 pooka ssize_t
574 1.1 pooka write(int fd, const void *buf, size_t len)
575 1.1 pooka {
576 1.1 pooka int (*op_write)(int, const void *, size_t);
577 1.1 pooka
578 1.2 pooka if (fd_isrump(fd)) {
579 1.2 pooka fd = fd_host2rump(fd);
580 1.2 pooka op_write = rumpcalls[RUMPCALL_WRITE];
581 1.2 pooka } else {
582 1.1 pooka op_write = host_write;
583 1.1 pooka }
584 1.1 pooka
585 1.1 pooka return op_write(fd, buf, len);
586 1.1 pooka }
587 1.1 pooka
588 1.1 pooka ssize_t
589 1.1 pooka writev(int fd, const struct iovec *iov, int iovcnt)
590 1.1 pooka {
591 1.1 pooka int (*op_writev)(int, const struct iovec *, int);
592 1.1 pooka
593 1.7 pooka DPRINTF(("writev %d\n", fd));
594 1.2 pooka if (fd_isrump(fd)) {
595 1.2 pooka fd = fd_host2rump(fd);
596 1.2 pooka op_writev = rumpcalls[RUMPCALL_WRITEV];
597 1.2 pooka } else {
598 1.1 pooka op_writev = host_writev;
599 1.1 pooka }
600 1.1 pooka
601 1.1 pooka return op_writev(fd, iov, iovcnt);
602 1.1 pooka }
603 1.1 pooka
604 1.1 pooka int
605 1.1 pooka ioctl(int fd, unsigned long cmd, ...)
606 1.1 pooka {
607 1.1 pooka int (*op_ioctl)(int, unsigned long cmd, ...);
608 1.1 pooka va_list ap;
609 1.1 pooka int rv;
610 1.1 pooka
611 1.1 pooka DPRINTF(("ioctl\n"));
612 1.2 pooka if (fd_isrump(fd)) {
613 1.2 pooka fd = fd_host2rump(fd);
614 1.2 pooka op_ioctl = rumpcalls[RUMPCALL_IOCTL];
615 1.2 pooka } else {
616 1.1 pooka op_ioctl = host_ioctl;
617 1.1 pooka }
618 1.1 pooka
619 1.1 pooka va_start(ap, cmd);
620 1.1 pooka rv = op_ioctl(fd, cmd, va_arg(ap, void *));
621 1.1 pooka va_end(ap);
622 1.1 pooka return rv;
623 1.1 pooka }
624 1.1 pooka
625 1.1 pooka int
626 1.1 pooka fcntl(int fd, int cmd, ...)
627 1.1 pooka {
628 1.1 pooka int (*op_fcntl)(int, int, ...);
629 1.1 pooka va_list ap;
630 1.1 pooka int rv;
631 1.1 pooka
632 1.1 pooka DPRINTF(("fcntl\n"));
633 1.2 pooka if (fd_isrump(fd)) {
634 1.2 pooka fd = fd_host2rump(fd);
635 1.2 pooka op_fcntl = rumpcalls[RUMPCALL_FCNTL];
636 1.2 pooka } else {
637 1.1 pooka op_fcntl = host_fcntl;
638 1.1 pooka }
639 1.1 pooka
640 1.1 pooka va_start(ap, cmd);
641 1.1 pooka rv = op_fcntl(fd, cmd, va_arg(ap, void *));
642 1.1 pooka va_end(ap);
643 1.1 pooka return rv;
644 1.1 pooka }
645 1.1 pooka
646 1.1 pooka int
647 1.1 pooka close(int fd)
648 1.1 pooka {
649 1.1 pooka int (*op_close)(int);
650 1.1 pooka
651 1.1 pooka DPRINTF(("close %d\n", fd));
652 1.2 pooka if (fd_isrump(fd)) {
653 1.2 pooka fd = fd_host2rump(fd);
654 1.2 pooka op_close = rumpcalls[RUMPCALL_CLOSE];
655 1.2 pooka } else {
656 1.1 pooka op_close = host_close;
657 1.1 pooka }
658 1.1 pooka
659 1.1 pooka return op_close(fd);
660 1.1 pooka }
661 1.1 pooka
/*
 * select(2) implemented on top of pollts().  The descriptor sets are
 * converted into a pollfd vector, pollts() does the waiting (and the
 * host / rump kernel split), and the results are written back into the
 * sets.
 *
 * Returns what pollts() returns: the number of pollfd entries with
 * events, 0 on timeout (with the sets cleared), or -1 on error (with
 * the sets left untouched).
 */
int
select(int nfds, fd_set *readfds, fd_set *writefds, fd_set *exceptfds,
	struct timeval *timeout)
{
	struct pollfd *pfds = NULL;
	struct timespec ts, *tsp = NULL;
	nfds_t realnfds = 0, j;
	short events;
	int rv, i;

	DPRINTF(("select\n"));

	if (nfds < 0) {
		errno = EINVAL;
		return -1;
	}

	/*
	 * Well, first we must scan the fds to figure out how many
	 * fds there really are.  This is because up to and including
	 * nb5 poll() silently refuses nfds > process_open_fds.
	 * Seems to be fixed in current.
	 */
	for (i = 0; i < nfds; i++) {
		if ((readfds && FD_ISSET(i, readfds)) ||
		    (writefds && FD_ISSET(i, writefds)) ||
		    (exceptfds && FD_ISSET(i, exceptfds)))
			realnfds++;
	}

	if (realnfds) {
		pfds = malloc(sizeof(*pfds) * realnfds);
		if (!pfds)
			return -1;
	}

	/*
	 * Fill in one entry per selected descriptor.  The events are
	 * collected first so that pfds[] is touched only for descriptors
	 * counted above; pfds is NULL when none is selected.
	 */
	for (i = 0, j = 0; i < nfds; i++) {
		events = 0;
		if (readfds && FD_ISSET(i, readfds))
			events |= POLLIN;
		if (writefds && FD_ISSET(i, writefds))
			events |= POLLOUT;
		if (exceptfds && FD_ISSET(i, exceptfds))
			events |= POLLHUP|POLLERR;
		if (events == 0)
			continue;

		pfds[j].fd = i;
		pfds[j].events = events;
		pfds[j].revents = 0;
		j++;
	}

	if (timeout) {
		TIMEVAL_TO_TIMESPEC(timeout, &ts);
		tsp = &ts;
	}
	rv = pollts(pfds, realnfds, tsp, NULL);
	if (rv < 0)
		goto out;

	/*
	 * ok, harvest results.  first zero out entries (can't use
	 * FD_ZERO for the obvious select-me-not reason).  This is done
	 * for a timeout (rv == 0) as well, so that no descriptor is
	 * reported ready.
	 */
	for (i = 0; i < nfds; i++) {
		if (readfds)
			FD_CLR(i, readfds);
		if (writefds)
			FD_CLR(i, writefds);
		if (exceptfds)
			FD_CLR(i, exceptfds);
	}

	/* and then plug in the results */
	for (j = 0; j < realnfds; j++) {
		if (readfds && (pfds[j].revents & POLLIN))
			FD_SET(pfds[j].fd, readfds);
		if (writefds && (pfds[j].revents & POLLOUT))
			FD_SET(pfds[j].fd, writefds);
		if (exceptfds && (pfds[j].revents & (POLLHUP|POLLERR)))
			FD_SET(pfds[j].fd, exceptfds);
	}

 out:
	free(pfds);
	return rv;
}
770 1.1 pooka
/*
 * Count how many entries of the poll vector refer to rump kernel
 * descriptors and how many to host descriptors.  The counters are
 * incremented, not reset.
 */
static void
checkpoll(struct pollfd *fds, nfds_t nfds, int *hostcall, int *rumpcall)
{
	nfds_t i;
	int *counter;

	for (i = 0; i < nfds; i++) {
		counter = fd_isrump(fds[i].fd) ? rumpcall : hostcall;
		(*counter)++;
	}
}
783 1.1 pooka
/*
 * Rewrite the descriptor of every entry in the poll vector with
 * fdadj(); events and revents are left alone.
 */
static void
adjustpoll(struct pollfd *fds, nfds_t nfds, int (*fdadj)(int))
{

	while (nfds-- > 0) {
		fds->fd = fdadj(fds->fd);
		fds++;
	}
}
793 1.1 pooka
/*
 * poll is easy as long as all the fds of a call belong to one kernel.
 * otherwise it's quite tricky: the host part is polled in a helper
 * thread (hostpoll) that is handed its arguments in this structure.
 */
struct pollarg {
	struct pollfd *pfds;		/* vector for host_pollts() */
	nfds_t nfds;			/* number of entries in pfds */
	const struct timespec *ts;	/* timeout passed through */
	const sigset_t *sigmask;	/* signal mask passed through */
	int pipefd;			/* rump fd written when the poll returns */
	int errnum;			/* errno of a failed host_pollts() */
};
806 1.1 pooka
807 1.1 pooka static void *
808 1.1 pooka hostpoll(void *arg)
809 1.1 pooka {
810 1.1 pooka struct pollarg *parg = arg;
811 1.1 pooka intptr_t rv;
812 1.1 pooka
813 1.3 pooka rv = host_pollts(parg->pfds, parg->nfds, parg->ts, parg->sigmask);
814 1.1 pooka if (rv == -1)
815 1.1 pooka parg->errnum = errno;
816 1.1 pooka rump_sys_write(parg->pipefd, &rv, sizeof(rv));
817 1.1 pooka
818 1.1 pooka return (void *)(intptr_t)rv;
819 1.1 pooka }
820 1.1 pooka
821 1.1 pooka int
822 1.3 pooka pollts(struct pollfd *fds, nfds_t nfds, const struct timespec *ts,
823 1.3 pooka const sigset_t *sigmask)
824 1.1 pooka {
825 1.3 pooka int (*op_pollts)(struct pollfd *, nfds_t, const struct timespec *,
826 1.3 pooka const sigset_t *);
827 1.1 pooka int hostcall = 0, rumpcall = 0;
828 1.1 pooka pthread_t pt;
829 1.1 pooka nfds_t i;
830 1.1 pooka int rv;
831 1.1 pooka
832 1.2 pooka DPRINTF(("poll\n"));
833 1.1 pooka checkpoll(fds, nfds, &hostcall, &rumpcall);
834 1.1 pooka
835 1.1 pooka if (hostcall && rumpcall) {
836 1.1 pooka struct pollfd *pfd_host = NULL, *pfd_rump = NULL;
837 1.1 pooka int rpipe[2] = {-1,-1}, hpipe[2] = {-1,-1};
838 1.1 pooka struct pollarg parg;
839 1.1 pooka uintptr_t lrv;
840 1.1 pooka int sverrno = 0, trv;
841 1.1 pooka
842 1.1 pooka /*
843 1.1 pooka * ok, this is where it gets tricky. We must support
844 1.1 pooka * this since it's a very common operation in certain
845 1.1 pooka * types of software (telnet, netcat, etc). We allocate
846 1.1 pooka * two vectors and run two poll commands in separate
847 1.1 pooka * threads. Whichever returns first "wins" and the
848 1.1 pooka * other kernel's fds won't show activity.
849 1.1 pooka */
850 1.1 pooka rv = -1;
851 1.1 pooka
852 1.1 pooka /* allocate full vector for O(n) joining after call */
853 1.1 pooka pfd_host = malloc(sizeof(*pfd_host)*(nfds+1));
854 1.1 pooka if (!pfd_host)
855 1.1 pooka goto out;
856 1.1 pooka pfd_rump = malloc(sizeof(*pfd_rump)*(nfds+1));
857 1.1 pooka if (!pfd_rump) {
858 1.1 pooka goto out;
859 1.1 pooka }
860 1.1 pooka
861 1.1 pooka /* split vectors */
862 1.1 pooka for (i = 0; i < nfds; i++) {
863 1.3 pooka if (fds[i].fd == -1) {
864 1.3 pooka pfd_host[i].fd = -1;
865 1.3 pooka pfd_rump[i].fd = -1;
866 1.3 pooka } else if (fd_isrump(fds[i].fd)) {
867 1.2 pooka pfd_host[i].fd = -1;
868 1.2 pooka pfd_rump[i].fd = fd_host2rump(fds[i].fd);
869 1.2 pooka pfd_rump[i].events = fds[i].events;
870 1.2 pooka } else {
871 1.2 pooka pfd_rump[i].fd = -1;
872 1.1 pooka pfd_host[i].fd = fds[i].fd;
873 1.1 pooka pfd_host[i].events = fds[i].events;
874 1.1 pooka }
875 1.1 pooka }
876 1.1 pooka
877 1.1 pooka /*
878 1.1 pooka * then, open two pipes, one for notifications
879 1.1 pooka * to each kernel.
880 1.1 pooka */
881 1.1 pooka if (rump_sys_pipe(rpipe) == -1)
882 1.1 pooka goto out;
883 1.1 pooka if (pipe(hpipe) == -1)
884 1.1 pooka goto out;
885 1.1 pooka
886 1.1 pooka pfd_host[nfds].fd = hpipe[0];
887 1.1 pooka pfd_host[nfds].events = POLLIN;
888 1.1 pooka pfd_rump[nfds].fd = rpipe[0];
889 1.1 pooka pfd_rump[nfds].events = POLLIN;
890 1.1 pooka
891 1.1 pooka /*
892 1.1 pooka * then, create a thread to do host part and meanwhile
893 1.1 pooka * do rump kernel part right here
894 1.1 pooka */
895 1.1 pooka
896 1.1 pooka parg.pfds = pfd_host;
897 1.1 pooka parg.nfds = nfds+1;
898 1.3 pooka parg.ts = ts;
899 1.3 pooka parg.sigmask = sigmask;
900 1.1 pooka parg.pipefd = rpipe[1];
901 1.1 pooka pthread_create(&pt, NULL, hostpoll, &parg);
902 1.1 pooka
903 1.3 pooka op_pollts = rumpcalls[RUMPCALL_POLLTS];
904 1.3 pooka lrv = op_pollts(pfd_rump, nfds+1, ts, NULL);
905 1.1 pooka sverrno = errno;
906 1.1 pooka write(hpipe[1], &rv, sizeof(rv));
907 1.1 pooka pthread_join(pt, (void *)&trv);
908 1.1 pooka
909 1.1 pooka /* check who "won" and merge results */
910 1.1 pooka if (lrv != 0 && pfd_host[nfds].revents & POLLIN) {
911 1.1 pooka rv = trv;
912 1.1 pooka
913 1.1 pooka for (i = 0; i < nfds; i++) {
914 1.1 pooka if (pfd_rump[i].fd != -1)
915 1.1 pooka fds[i].revents = pfd_rump[i].revents;
916 1.1 pooka }
917 1.1 pooka sverrno = parg.errnum;
918 1.1 pooka } else if (trv != 0 && pfd_rump[nfds].revents & POLLIN) {
919 1.1 pooka rv = trv;
920 1.1 pooka
921 1.1 pooka for (i = 0; i < nfds; i++) {
922 1.1 pooka if (pfd_host[i].fd != -1)
923 1.1 pooka fds[i].revents = pfd_host[i].revents;
924 1.1 pooka }
925 1.1 pooka } else {
926 1.1 pooka rv = 0;
927 1.1 pooka }
928 1.1 pooka
929 1.1 pooka out:
930 1.1 pooka if (rpipe[0] != -1)
931 1.1 pooka rump_sys_close(rpipe[0]);
932 1.1 pooka if (rpipe[1] != -1)
933 1.1 pooka rump_sys_close(rpipe[1]);
934 1.1 pooka if (hpipe[0] != -1)
935 1.1 pooka close(hpipe[0]);
936 1.1 pooka if (hpipe[1] != -1)
937 1.1 pooka close(hpipe[1]);
938 1.1 pooka free(pfd_host);
939 1.1 pooka free(pfd_rump);
940 1.1 pooka errno = sverrno;
941 1.1 pooka } else {
942 1.1 pooka if (hostcall) {
943 1.3 pooka op_pollts = host_pollts;
944 1.1 pooka } else {
945 1.3 pooka op_pollts = rumpcalls[RUMPCALL_POLLTS];
946 1.2 pooka adjustpoll(fds, nfds, fd_host2rump);
947 1.1 pooka }
948 1.1 pooka
949 1.3 pooka rv = op_pollts(fds, nfds, ts, sigmask);
950 1.1 pooka if (rumpcall)
951 1.2 pooka adjustpoll(fds, nfds, fd_rump2host);
952 1.1 pooka }
953 1.1 pooka
954 1.1 pooka return rv;
955 1.1 pooka }
956 1.1 pooka
957 1.1 pooka int
958 1.3 pooka poll(struct pollfd *fds, nfds_t nfds, int timeout)
959 1.1 pooka {
960 1.3 pooka struct timespec ts;
961 1.3 pooka struct timespec *tsp = NULL;
962 1.3 pooka
963 1.3 pooka if (timeout != INFTIM) {
964 1.3 pooka ts.tv_sec = timeout / 1000;
965 1.3 pooka ts.tv_nsec = (timeout % 1000) * 1000;
966 1.3 pooka
967 1.3 pooka tsp = &ts;
968 1.3 pooka }
969 1.1 pooka
970 1.3 pooka return pollts(fds, nfds, tsp, NULL);
971 1.1 pooka }
972