rumpuser.c revision 1.30 1 1.30 pooka /* $NetBSD: rumpuser.c,v 1.30 2013/04/27 14:59:08 pooka Exp $ */
2 1.1 pooka
3 1.1 pooka /*
4 1.1 pooka * Copyright (c) 2007-2010 Antti Kantee. All Rights Reserved.
5 1.1 pooka *
6 1.1 pooka * Redistribution and use in source and binary forms, with or without
7 1.1 pooka * modification, are permitted provided that the following conditions
8 1.1 pooka * are met:
9 1.1 pooka * 1. Redistributions of source code must retain the above copyright
10 1.1 pooka * notice, this list of conditions and the following disclaimer.
11 1.1 pooka * 2. Redistributions in binary form must reproduce the above copyright
12 1.1 pooka * notice, this list of conditions and the following disclaimer in the
13 1.1 pooka * documentation and/or other materials provided with the distribution.
14 1.1 pooka *
15 1.1 pooka * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS
16 1.1 pooka * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
17 1.1 pooka * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
18 1.1 pooka * DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
19 1.1 pooka * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
20 1.1 pooka * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
21 1.1 pooka * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
22 1.1 pooka * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
23 1.1 pooka * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
24 1.1 pooka * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
25 1.1 pooka * SUCH DAMAGE.
26 1.1 pooka */
27 1.1 pooka
28 1.18 pooka #include "rumpuser_port.h"
29 1.18 pooka
30 1.1 pooka #if !defined(lint)
31 1.30 pooka __RCSID("$NetBSD: rumpuser.c,v 1.30 2013/04/27 14:59:08 pooka Exp $");
32 1.1 pooka #endif /* !lint */
33 1.1 pooka
34 1.1 pooka #include <sys/ioctl.h>
35 1.1 pooka #include <sys/mman.h>
36 1.1 pooka #include <sys/uio.h>
37 1.18 pooka #include <sys/stat.h>
38 1.18 pooka #include <sys/time.h>
39 1.1 pooka
40 1.1 pooka #ifdef __NetBSD__
41 1.15 pooka #include <sys/disk.h>
42 1.1 pooka #include <sys/disklabel.h>
43 1.15 pooka #include <sys/dkio.h>
44 1.25 pooka #include <sys/event.h>
45 1.25 pooka #endif
46 1.25 pooka
47 1.25 pooka #if defined(__NetBSD__) || defined(__FreeBSD__) || defined(__DragonFly__)
48 1.4 pooka #include <sys/sysctl.h>
49 1.1 pooka #endif
50 1.1 pooka
51 1.1 pooka #include <assert.h>
52 1.1 pooka #include <errno.h>
53 1.1 pooka #include <fcntl.h>
54 1.23 pooka #include <netdb.h>
55 1.1 pooka #include <poll.h>
56 1.2 pooka #include <signal.h>
57 1.1 pooka #include <stdarg.h>
58 1.1 pooka #include <stdint.h>
59 1.1 pooka #include <stdio.h>
60 1.1 pooka #include <stdlib.h>
61 1.1 pooka #include <string.h>
62 1.1 pooka #include <time.h>
63 1.1 pooka #include <unistd.h>
64 1.1 pooka
65 1.1 pooka #include <rump/rumpuser.h>
66 1.1 pooka
67 1.1 pooka #include "rumpuser_int.h"
68 1.1 pooka
69 1.30 pooka rump_unschedulefn rumpuser__unschedule;
70 1.30 pooka rump_reschedulefn rumpuser__reschedule;
71 1.30 pooka
72 1.1 pooka int
73 1.30 pooka rumpuser_init(int version,
74 1.30 pooka rump_reschedulefn rumpkern_resched, rump_unschedulefn rumpkern_unsched)
75 1.8 pooka {
76 1.8 pooka
77 1.30 pooka if (version != RUMPUSER_VERSION) {
78 1.30 pooka fprintf(stderr, "rumpuser mismatch, kern: %d, hypervisor %d\n",
79 1.30 pooka version, RUMPUSER_VERSION);
80 1.30 pooka return 1;
81 1.30 pooka }
82 1.30 pooka
83 1.30 pooka #ifdef RUMPUSER_USE_RANDOM
84 1.30 pooka uint32_t rv;
85 1.30 pooka int fd;
86 1.30 pooka
87 1.30 pooka if ((fd = open("/dev/urandom", O_RDONLY)) == -1) {
88 1.30 pooka srandom(time(NULL));
89 1.30 pooka } else {
90 1.30 pooka if (read(fd, &rv, sizeof(rv)) != sizeof(rv))
91 1.30 pooka srandom(time(NULL));
92 1.30 pooka else
93 1.30 pooka srandom(rv);
94 1.30 pooka close(fd);
95 1.30 pooka }
96 1.30 pooka #endif
97 1.30 pooka
98 1.30 pooka rumpuser__thrinit();
99 1.30 pooka
100 1.30 pooka rumpuser__unschedule = rumpkern_unsched;
101 1.30 pooka rumpuser__reschedule = rumpkern_resched;
102 1.30 pooka
103 1.30 pooka return 0;
104 1.8 pooka }
105 1.8 pooka
106 1.8 pooka int
107 1.1 pooka rumpuser_getfileinfo(const char *path, uint64_t *sizep, int *ftp, int *error)
108 1.1 pooka {
109 1.1 pooka struct stat sb;
110 1.1 pooka uint64_t size;
111 1.1 pooka int needsdev = 0, rv = 0, ft;
112 1.12 pooka int fd = -1;
113 1.1 pooka
114 1.1 pooka if (stat(path, &sb) == -1) {
115 1.10 pooka seterror(errno);
116 1.1 pooka return -1;
117 1.1 pooka }
118 1.1 pooka
119 1.1 pooka switch (sb.st_mode & S_IFMT) {
120 1.1 pooka case S_IFDIR:
121 1.1 pooka ft = RUMPUSER_FT_DIR;
122 1.1 pooka break;
123 1.1 pooka case S_IFREG:
124 1.1 pooka ft = RUMPUSER_FT_REG;
125 1.1 pooka break;
126 1.1 pooka case S_IFBLK:
127 1.1 pooka ft = RUMPUSER_FT_BLK;
128 1.1 pooka needsdev = 1;
129 1.1 pooka break;
130 1.1 pooka case S_IFCHR:
131 1.1 pooka ft = RUMPUSER_FT_CHR;
132 1.1 pooka needsdev = 1;
133 1.1 pooka break;
134 1.1 pooka default:
135 1.1 pooka ft = RUMPUSER_FT_OTHER;
136 1.1 pooka break;
137 1.1 pooka }
138 1.1 pooka
139 1.1 pooka if (!needsdev) {
140 1.1 pooka size = sb.st_size;
141 1.1 pooka } else if (sizep) {
142 1.1 pooka /*
143 1.1 pooka * Welcome to the jungle. Of course querying the kernel
144 1.1 pooka * for a device partition size is supposed to be far from
145 1.1 pooka * trivial. On NetBSD we use ioctl. On $other platform
146 1.1 pooka * we have a problem. We try "the lseek trick" and just
147 1.1 pooka * fail if that fails. Platform specific code can later
148 1.1 pooka * be written here if appropriate.
149 1.1 pooka *
150 1.1 pooka * On NetBSD we hope and pray that for block devices nobody
151 1.1 pooka * else is holding them open, because otherwise the kernel
152 1.1 pooka * will not permit us to open it. Thankfully, this is
153 1.1 pooka * usually called only in bootstrap and then we can
154 1.1 pooka * forget about it.
155 1.1 pooka */
156 1.1 pooka #ifndef __NetBSD__
157 1.1 pooka off_t off;
158 1.1 pooka
159 1.1 pooka fd = open(path, O_RDONLY);
160 1.1 pooka if (fd == -1) {
161 1.10 pooka seterror(errno);
162 1.1 pooka rv = -1;
163 1.1 pooka goto out;
164 1.1 pooka }
165 1.1 pooka
166 1.1 pooka off = lseek(fd, 0, SEEK_END);
167 1.1 pooka if (off != 0) {
168 1.1 pooka size = off;
169 1.1 pooka goto out;
170 1.1 pooka }
171 1.1 pooka fprintf(stderr, "error: device size query not implemented on "
172 1.1 pooka "this platform\n");
173 1.12 pooka seterror(EOPNOTSUPP);
174 1.1 pooka rv = -1;
175 1.1 pooka goto out;
176 1.1 pooka #else
177 1.1 pooka struct disklabel lab;
178 1.1 pooka struct partition *parta;
179 1.15 pooka struct dkwedge_info dkw;
180 1.1 pooka
181 1.1 pooka fd = open(path, O_RDONLY);
182 1.1 pooka if (fd == -1) {
183 1.10 pooka seterror(errno);
184 1.1 pooka rv = -1;
185 1.1 pooka goto out;
186 1.1 pooka }
187 1.1 pooka
188 1.15 pooka if (ioctl(fd, DIOCGDINFO, &lab) == 0) {
189 1.15 pooka parta = &lab.d_partitions[DISKPART(sb.st_rdev)];
190 1.15 pooka size = (uint64_t)lab.d_secsize * parta->p_size;
191 1.15 pooka goto out;
192 1.15 pooka }
193 1.15 pooka
194 1.15 pooka if (ioctl(fd, DIOCGWEDGEINFO, &dkw) == 0) {
195 1.15 pooka /*
196 1.15 pooka * XXX: should use DIOCGDISKINFO to query
197 1.15 pooka * sector size, but that requires proplib,
198 1.15 pooka * so just don't bother for now. it's nice
199 1.15 pooka * that something as difficult as figuring out
200 1.15 pooka * a partition's size has been made so easy.
201 1.15 pooka */
202 1.15 pooka size = dkw.dkw_size << DEV_BSHIFT;
203 1.1 pooka goto out;
204 1.1 pooka }
205 1.1 pooka
206 1.15 pooka seterror(errno);
207 1.15 pooka rv = -1;
208 1.1 pooka #endif /* __NetBSD__ */
209 1.1 pooka }
210 1.1 pooka
211 1.1 pooka out:
212 1.1 pooka if (rv == 0 && sizep)
213 1.1 pooka *sizep = size;
214 1.1 pooka if (rv == 0 && ftp)
215 1.1 pooka *ftp = ft;
216 1.12 pooka if (fd != -1)
217 1.12 pooka close(fd);
218 1.1 pooka
219 1.1 pooka return rv;
220 1.1 pooka }
221 1.1 pooka
/*
 * Sleep for the interval given by *sec seconds plus *nsec nanoseconds.
 *
 * On return *sec and *nsec hold the time remaining as reported by
 * nanosleep(2).  nanosleep(2) only fills in the remainder when the
 * sleep is interrupted, so the remainder is preset to zero; otherwise
 * uninitialized stack contents would be handed back to the caller.
 *
 * Returns the nanosleep(2) return value; on -1 the errno value is
 * reported through seterror().
 */
int
rumpuser_nanosleep(uint64_t *sec, uint64_t *nsec, int *error)
{
	struct timespec rqt, rmt;
	int rv;

	/*LINTED*/
	rqt.tv_sec = *sec;
	/*LINTED*/
	rqt.tv_nsec = *nsec;

	/* defined result for the not-interrupted and failure cases */
	rmt.tv_sec = 0;
	rmt.tv_nsec = 0;

	KLOCK_WRAP(rv = nanosleep(&rqt, &rmt));
	if (rv == -1)
		seterror(errno);

	*sec = rmt.tv_sec;
	*nsec = rmt.tv_nsec;

	return rv;
}
242 1.1 pooka
/*
 * Allocate `howmuch' bytes aligned to at least `alignment' bytes.
 *
 * An alignment of 0 means "no particular requirement" and is mapped to
 * sizeof(void *), the minimum posix_memalign(3) accepts.  Power-of-two
 * alignments smaller than sizeof(void *) are rounded up to it as well;
 * the stricter alignment satisfies the weaker request.
 *
 * Returns the allocation (release it with rumpuser_free()) or NULL if
 * memory is exhausted.  An alignment posix_memalign(3) rejects is
 * treated as a programming error: a diagnostic is written to stderr
 * (unbuffered, so it is not lost) and the process aborts.
 */
void *
rumpuser_malloc(size_t howmuch, int alignment)
{
	void *mem = NULL;
	size_t align;
	int rv;

	if (alignment == 0) {
		align = sizeof(void *);
	} else if (alignment > 0 && (size_t)alignment < sizeof(void *) &&
	    (alignment & (alignment - 1)) == 0) {
		align = sizeof(void *);
	} else {
		align = (size_t)alignment;
	}

	rv = posix_memalign(&mem, align, howmuch);
	if (rv != 0) {
		if (rv == EINVAL) {
			fprintf(stderr,
			    "rumpuser_malloc: invalid alignment %d\n",
			    alignment);
			abort();
		}
		mem = NULL;
	}

	return mem;
}
264 1.1 pooka
/*
 * Resize the allocation `ptr' to `howmuch' bytes with realloc(3) and
 * return whatever realloc(3) returns.
 */
void *
rumpuser_realloc(void *ptr, size_t howmuch)
{
	void *resized;

	resized = realloc(ptr, howmuch);
	return resized;
}
271 1.1 pooka
/*
 * Release memory with free(3).
 */
void
rumpuser_free(void *ptr)
{

	free(ptr);
}
278 1.1 pooka
279 1.1 pooka void *
280 1.7 pooka rumpuser_anonmmap(void *prefaddr, size_t size, int alignbit,
281 1.7 pooka int exec, int *error)
282 1.1 pooka {
283 1.1 pooka void *rv;
284 1.1 pooka int prot;
285 1.1 pooka
286 1.18 pooka #ifndef MAP_ALIGNED
287 1.18 pooka #define MAP_ALIGNED(a) 0
288 1.18 pooka if (alignbit)
289 1.18 pooka fprintf(stderr, "rumpuser_anonmmap: warning, requested "
290 1.18 pooka "alignment not supported by hypervisor\n");
291 1.18 pooka #endif
292 1.18 pooka
293 1.1 pooka prot = PROT_READ|PROT_WRITE;
294 1.1 pooka if (exec)
295 1.1 pooka prot |= PROT_EXEC;
296 1.7 pooka rv = mmap(prefaddr, size, prot,
297 1.24 pooka MAP_PRIVATE | MAP_ANON | MAP_ALIGNED(alignbit), -1, 0);
298 1.1 pooka if (rv == MAP_FAILED) {
299 1.10 pooka seterror(errno);
300 1.1 pooka return NULL;
301 1.1 pooka }
302 1.1 pooka return rv;
303 1.1 pooka }
304 1.1 pooka
/*
 * Remove the mapping [addr, addr+len) with munmap(2).  Failure is
 * caught only by assert(), i.e. it goes unnoticed in NDEBUG builds.
 */
void
rumpuser_unmap(void *addr, size_t len)
{
	int ret;

	ret = munmap(addr, len);
	assert(ret == 0);
}
313 1.1 pooka
314 1.1 pooka void *
315 1.1 pooka rumpuser_filemmap(int fd, off_t offset, size_t len, int flags, int *error)
316 1.1 pooka {
317 1.1 pooka void *rv;
318 1.1 pooka int mmflags, prot;
319 1.1 pooka
320 1.22 pooka if (flags & RUMPUSER_FILEMMAP_TRUNCATE) {
321 1.22 pooka if (ftruncate(fd, offset + len) == -1) {
322 1.22 pooka seterror(errno);
323 1.22 pooka return NULL;
324 1.22 pooka }
325 1.22 pooka }
326 1.1 pooka
327 1.23 pooka /* it's implicit */
328 1.23 pooka #if defined(__sun__) && !defined(MAP_FILE)
329 1.23 pooka #define MAP_FILE 0
330 1.23 pooka #endif
331 1.23 pooka
332 1.1 pooka mmflags = MAP_FILE;
333 1.1 pooka if (flags & RUMPUSER_FILEMMAP_SHARED)
334 1.1 pooka mmflags |= MAP_SHARED;
335 1.1 pooka else
336 1.1 pooka mmflags |= MAP_PRIVATE;
337 1.1 pooka
338 1.1 pooka prot = 0;
339 1.1 pooka if (flags & RUMPUSER_FILEMMAP_READ)
340 1.1 pooka prot |= PROT_READ;
341 1.1 pooka if (flags & RUMPUSER_FILEMMAP_WRITE)
342 1.1 pooka prot |= PROT_WRITE;
343 1.1 pooka
344 1.1 pooka rv = mmap(NULL, len, PROT_READ|PROT_WRITE, mmflags, fd, offset);
345 1.1 pooka if (rv == MAP_FAILED) {
346 1.10 pooka seterror(errno);
347 1.1 pooka return NULL;
348 1.1 pooka }
349 1.1 pooka
350 1.10 pooka seterror(0);
351 1.1 pooka return rv;
352 1.1 pooka }
353 1.1 pooka
354 1.1 pooka int
355 1.1 pooka rumpuser_memsync(void *addr, size_t len, int *error)
356 1.1 pooka {
357 1.1 pooka
358 1.1 pooka DOCALL_KLOCK(int, (msync(addr, len, MS_SYNC)));
359 1.1 pooka }
360 1.1 pooka
361 1.1 pooka int
362 1.20 pooka rumpuser_open(const char *path, int ruflags, int *error)
363 1.1 pooka {
364 1.20 pooka int flags;
365 1.1 pooka
366 1.20 pooka switch (ruflags & RUMPUSER_OPEN_ACCMODE) {
367 1.20 pooka case RUMPUSER_OPEN_RDONLY:
368 1.20 pooka flags = O_RDONLY;
369 1.20 pooka break;
370 1.20 pooka case RUMPUSER_OPEN_WRONLY:
371 1.20 pooka flags = O_WRONLY;
372 1.20 pooka break;
373 1.20 pooka case RUMPUSER_OPEN_RDWR:
374 1.20 pooka flags = O_RDWR;
375 1.20 pooka break;
376 1.20 pooka default:
377 1.20 pooka *error = EINVAL;
378 1.20 pooka return -1;
379 1.20 pooka }
380 1.20 pooka
381 1.20 pooka #define TESTSET(_ru_, _h_) if (ruflags & _ru_) flags |= _h_;
382 1.20 pooka TESTSET(RUMPUSER_OPEN_CREATE, O_CREAT);
383 1.20 pooka TESTSET(RUMPUSER_OPEN_EXCL, O_EXCL);
384 1.23 pooka #ifdef O_DIRECT
385 1.20 pooka TESTSET(RUMPUSER_OPEN_DIRECT, O_DIRECT);
386 1.23 pooka #else
387 1.23 pooka if (ruflags & RUMPUSER_OPEN_DIRECT) {
388 1.23 pooka *error = EOPNOTSUPP;
389 1.23 pooka return -1;
390 1.23 pooka }
391 1.23 pooka #endif
392 1.20 pooka #undef TESTSET
393 1.20 pooka
394 1.20 pooka DOCALL_KLOCK(int, (open(path, flags, 0644)));
395 1.1 pooka }
396 1.1 pooka
397 1.1 pooka int
398 1.1 pooka rumpuser_ioctl(int fd, u_long cmd, void *data, int *error)
399 1.1 pooka {
400 1.1 pooka
401 1.1 pooka DOCALL_KLOCK(int, (ioctl(fd, cmd, data)));
402 1.1 pooka }
403 1.1 pooka
404 1.1 pooka int
405 1.1 pooka rumpuser_close(int fd, int *error)
406 1.1 pooka {
407 1.1 pooka
408 1.1 pooka DOCALL(int, close(fd));
409 1.1 pooka }
410 1.1 pooka
411 1.1 pooka int
412 1.1 pooka rumpuser_fsync(int fd, int *error)
413 1.1 pooka {
414 1.1 pooka
415 1.1 pooka DOCALL_KLOCK(int, fsync(fd));
416 1.1 pooka }
417 1.1 pooka
/*
 * read(2) up to `size' bytes from `fd' into `data'.
 *
 * Returns the read(2) result; on -1 errno is reported via seterror().
 */
ssize_t
rumpuser_read(int fd, void *data, size_t size, int *error)
{
	ssize_t nread;

	KLOCK_WRAP(nread = read(fd, data, size));
	if (nread == -1)
		seterror(errno);

	return nread;
}
429 1.1 pooka
/*
 * pread(2) up to `size' bytes from `fd' at `offset' into `data'.
 *
 * Returns the pread(2) result; on -1 errno is reported via seterror().
 */
ssize_t
rumpuser_pread(int fd, void *data, size_t size, off_t offset, int *error)
{
	ssize_t nread;

	KLOCK_WRAP(nread = pread(fd, data, size, offset));
	if (nread == -1)
		seterror(errno);

	return nread;
}
441 1.1 pooka
442 1.1 pooka void
443 1.1 pooka rumpuser_read_bio(int fd, void *data, size_t size, off_t offset,
444 1.1 pooka rump_biodone_fn biodone, void *biodonecookie)
445 1.1 pooka {
446 1.1 pooka ssize_t rv;
447 1.1 pooka int error = 0;
448 1.1 pooka
449 1.1 pooka rv = rumpuser_pread(fd, data, size, offset, &error);
450 1.1 pooka /* check against <0 instead of ==-1 to get typing below right */
451 1.1 pooka if (rv < 0)
452 1.1 pooka rv = 0;
453 1.1 pooka
454 1.1 pooka /* LINTED: see above */
455 1.1 pooka biodone(biodonecookie, rv, error);
456 1.1 pooka }
457 1.1 pooka
/*
 * write(2) `size' bytes from `data' to `fd'.
 *
 * Returns the write(2) result; on -1 errno is reported via seterror().
 */
ssize_t
rumpuser_write(int fd, const void *data, size_t size, int *error)
{
	ssize_t nwritten;

	KLOCK_WRAP(nwritten = write(fd, data, size));
	if (nwritten == -1)
		seterror(errno);

	return nwritten;
}
469 1.1 pooka
/*
 * pwrite(2) `size' bytes from `data' to `fd' at `offset'.
 *
 * Returns the pwrite(2) result; on -1 errno is reported via seterror().
 */
ssize_t
rumpuser_pwrite(int fd, const void *data, size_t size, off_t offset, int *error)
{
	ssize_t nwritten;

	KLOCK_WRAP(nwritten = pwrite(fd, data, size, offset));
	if (nwritten == -1)
		seterror(errno);

	return nwritten;
}
481 1.1 pooka
482 1.1 pooka void
483 1.1 pooka rumpuser_write_bio(int fd, const void *data, size_t size, off_t offset,
484 1.1 pooka rump_biodone_fn biodone, void *biodonecookie)
485 1.1 pooka {
486 1.1 pooka ssize_t rv;
487 1.1 pooka int error = 0;
488 1.1 pooka
489 1.1 pooka rv = rumpuser_pwrite(fd, data, size, offset, &error);
490 1.1 pooka /* check against <0 instead of ==-1 to get typing below right */
491 1.1 pooka if (rv < 0)
492 1.1 pooka rv = 0;
493 1.1 pooka
494 1.1 pooka /* LINTED: see above */
495 1.1 pooka biodone(biodonecookie, rv, error);
496 1.1 pooka }
497 1.1 pooka
498 1.1 pooka ssize_t
499 1.1 pooka rumpuser_readv(int fd, const struct rumpuser_iovec *riov, int iovcnt,
500 1.1 pooka int *error)
501 1.1 pooka {
502 1.1 pooka struct iovec *iovp;
503 1.1 pooka ssize_t rv;
504 1.1 pooka int i;
505 1.1 pooka
506 1.1 pooka iovp = malloc(iovcnt * sizeof(struct iovec));
507 1.1 pooka if (iovp == NULL) {
508 1.10 pooka seterror(ENOMEM);
509 1.1 pooka return -1;
510 1.1 pooka }
511 1.1 pooka for (i = 0; i < iovcnt; i++) {
512 1.1 pooka iovp[i].iov_base = riov[i].iov_base;
513 1.1 pooka /*LINTED*/
514 1.1 pooka iovp[i].iov_len = riov[i].iov_len;
515 1.1 pooka }
516 1.1 pooka
517 1.1 pooka KLOCK_WRAP(rv = readv(fd, iovp, iovcnt));
518 1.1 pooka if (rv == -1)
519 1.10 pooka seterror(errno);
520 1.1 pooka free(iovp);
521 1.1 pooka
522 1.1 pooka return rv;
523 1.1 pooka }
524 1.1 pooka
525 1.1 pooka ssize_t
526 1.1 pooka rumpuser_writev(int fd, const struct rumpuser_iovec *riov, int iovcnt,
527 1.1 pooka int *error)
528 1.1 pooka {
529 1.1 pooka struct iovec *iovp;
530 1.1 pooka ssize_t rv;
531 1.1 pooka int i;
532 1.1 pooka
533 1.1 pooka iovp = malloc(iovcnt * sizeof(struct iovec));
534 1.1 pooka if (iovp == NULL) {
535 1.10 pooka seterror(ENOMEM);
536 1.1 pooka return -1;
537 1.1 pooka }
538 1.1 pooka for (i = 0; i < iovcnt; i++) {
539 1.1 pooka iovp[i].iov_base = riov[i].iov_base;
540 1.1 pooka /*LINTED*/
541 1.1 pooka iovp[i].iov_len = riov[i].iov_len;
542 1.1 pooka }
543 1.1 pooka
544 1.1 pooka KLOCK_WRAP(rv = writev(fd, iovp, iovcnt));
545 1.1 pooka if (rv == -1)
546 1.10 pooka seterror(errno);
547 1.1 pooka free(iovp);
548 1.1 pooka
549 1.1 pooka return rv;
550 1.1 pooka }
551 1.1 pooka
552 1.1 pooka int
553 1.1 pooka rumpuser_gettime(uint64_t *sec, uint64_t *nsec, int *error)
554 1.1 pooka {
555 1.1 pooka struct timeval tv;
556 1.1 pooka int rv;
557 1.1 pooka
558 1.1 pooka rv = gettimeofday(&tv, NULL);
559 1.1 pooka if (rv == -1) {
560 1.10 pooka seterror(errno);
561 1.1 pooka return rv;
562 1.1 pooka }
563 1.1 pooka
564 1.1 pooka *sec = tv.tv_sec;
565 1.1 pooka *nsec = tv.tv_usec * 1000;
566 1.1 pooka
567 1.1 pooka return 0;
568 1.1 pooka }
569 1.1 pooka
570 1.1 pooka int
571 1.1 pooka rumpuser_getenv(const char *name, char *buf, size_t blen, int *error)
572 1.1 pooka {
573 1.1 pooka
574 1.1 pooka DOCALL(int, getenv_r(name, buf, blen));
575 1.1 pooka }
576 1.1 pooka
/*
 * Produce a host name for the rump kernel instance in `name' (at most
 * `namelen' bytes, always NUL-terminated by snprintf for namelen > 0).
 *
 * The name is "rump-<pid>.<hostname>.rumpdomain", or
 * "rump-<pid>.rumpdomain" when the host name cannot be obtained.
 *
 * Always succeeds: returns 0 and reports 0 through seterror().
 */
int
rumpuser_gethostname(char *name, size_t namelen, int *error)
{
	char tmp[MAXHOSTNAMELEN];

	if (gethostname(tmp, sizeof(tmp)) == -1) {
		snprintf(name, namelen, "rump-%05d.rumpdomain", (int)getpid());
	} else {
		/*
		 * gethostname(3) need not NUL-terminate a truncated name;
		 * make sure the %s below cannot run off the buffer.
		 */
		tmp[sizeof(tmp) - 1] = '\0';
		snprintf(name, namelen, "rump-%05d.%s.rumpdomain",
		    (int)getpid(), tmp);
	}

	seterror(0);
	return 0;
}
592 1.1 pooka
593 1.1 pooka int
594 1.1 pooka rumpuser_poll(struct pollfd *fds, int nfds, int timeout, int *error)
595 1.1 pooka {
596 1.1 pooka
597 1.1 pooka DOCALL_KLOCK(int, (poll(fds, (nfds_t)nfds, timeout)));
598 1.1 pooka }
599 1.1 pooka
600 1.1 pooka int
601 1.1 pooka rumpuser_putchar(int c, int *error)
602 1.1 pooka {
603 1.1 pooka
604 1.1 pooka DOCALL(int, (putchar(c)));
605 1.1 pooka }
606 1.1 pooka
607 1.1 pooka void
608 1.1 pooka rumpuser_exit(int rv)
609 1.1 pooka {
610 1.1 pooka
611 1.1 pooka if (rv == RUMPUSER_PANIC)
612 1.1 pooka abort();
613 1.1 pooka else
614 1.1 pooka exit(rv);
615 1.1 pooka }
616 1.1 pooka
/*
 * Set the host errno to `error'.
 */
void
rumpuser_seterrno(int error)
{

	errno = error;
}
623 1.1 pooka
624 1.21 pooka /*
625 1.21 pooka * On NetBSD we use kqueue, on Linux we use inotify. The underlying
626 1.21 pooka * interface requirements aren't quite the same, but we have a very
627 1.21 pooka * good chance of doing the fd->path mapping on Linux thanks to dcache,
628 1.21 pooka * so just keep the existing interfaces for now.
629 1.21 pooka */
630 1.21 pooka #if defined(__NetBSD__)
631 1.1 pooka int
632 1.1 pooka rumpuser_writewatchfile_setup(int kq, int fd, intptr_t opaque, int *error)
633 1.1 pooka {
634 1.1 pooka struct kevent kev;
635 1.1 pooka
636 1.1 pooka if (kq == -1) {
637 1.1 pooka kq = kqueue();
638 1.1 pooka if (kq == -1) {
639 1.10 pooka seterror(errno);
640 1.1 pooka return -1;
641 1.1 pooka }
642 1.1 pooka }
643 1.1 pooka
644 1.1 pooka EV_SET(&kev, fd, EVFILT_VNODE, EV_ADD|EV_ENABLE|EV_CLEAR,
645 1.1 pooka NOTE_WRITE, 0, opaque);
646 1.1 pooka if (kevent(kq, &kev, 1, NULL, 0, NULL) == -1) {
647 1.10 pooka seterror(errno);
648 1.1 pooka return -1;
649 1.1 pooka }
650 1.1 pooka
651 1.1 pooka return kq;
652 1.1 pooka }
653 1.1 pooka
654 1.1 pooka int
655 1.1 pooka rumpuser_writewatchfile_wait(int kq, intptr_t *opaque, int *error)
656 1.1 pooka {
657 1.1 pooka struct kevent kev;
658 1.1 pooka int rv;
659 1.1 pooka
660 1.9 pooka again:
661 1.1 pooka KLOCK_WRAP(rv = kevent(kq, NULL, 0, &kev, 1, NULL));
662 1.1 pooka if (rv == -1) {
663 1.9 pooka if (errno == EINTR)
664 1.9 pooka goto again;
665 1.10 pooka seterror(errno);
666 1.1 pooka return -1;
667 1.1 pooka }
668 1.1 pooka
669 1.1 pooka if (opaque)
670 1.1 pooka *opaque = kev.udata;
671 1.1 pooka return rv;
672 1.1 pooka }
673 1.21 pooka
674 1.21 pooka #elif defined(__linux__)
675 1.21 pooka #include <sys/inotify.h>
676 1.21 pooka
677 1.21 pooka int
678 1.21 pooka rumpuser_writewatchfile_setup(int inotify, int fd, intptr_t notused, int *error)
679 1.21 pooka {
680 1.21 pooka char procbuf[PATH_MAX], linkbuf[PATH_MAX];
681 1.21 pooka ssize_t nn;
682 1.21 pooka
683 1.21 pooka if (inotify == -1) {
684 1.21 pooka inotify = inotify_init();
685 1.21 pooka if (inotify == -1) {
686 1.21 pooka seterror(errno);
687 1.21 pooka return -1;
688 1.21 pooka }
689 1.21 pooka }
690 1.21 pooka
691 1.21 pooka /* ok, need to map fd into path for inotify */
692 1.21 pooka snprintf(procbuf, sizeof(procbuf), "/proc/self/fd/%d", fd);
693 1.29 pooka nn = readlink(procbuf, linkbuf, sizeof(linkbuf)-1);
694 1.29 pooka if (nn >= (ssize_t)sizeof(linkbuf)-1) {
695 1.21 pooka nn = -1;
696 1.21 pooka errno = E2BIG; /* pick something */
697 1.21 pooka }
698 1.21 pooka if (nn == -1) {
699 1.21 pooka seterror(errno);
700 1.21 pooka close(inotify);
701 1.21 pooka return -1;
702 1.21 pooka }
703 1.21 pooka
704 1.29 pooka linkbuf[nn] = '\0';
705 1.21 pooka if (inotify_add_watch(inotify, linkbuf, IN_MODIFY) == -1) {
706 1.21 pooka seterror(errno);
707 1.21 pooka close(inotify);
708 1.21 pooka return -1;
709 1.21 pooka }
710 1.21 pooka
711 1.21 pooka return inotify;
712 1.21 pooka }
713 1.21 pooka
714 1.21 pooka int
715 1.21 pooka rumpuser_writewatchfile_wait(int kq, intptr_t *opaque, int *error)
716 1.21 pooka {
717 1.21 pooka struct inotify_event iev;
718 1.21 pooka ssize_t nn;
719 1.21 pooka
720 1.21 pooka do {
721 1.21 pooka KLOCK_WRAP(nn = read(kq, &iev, sizeof(iev)));
722 1.21 pooka } while (errno == EINTR);
723 1.21 pooka
724 1.21 pooka if (nn == -1) {
725 1.21 pooka seterror(errno);
726 1.21 pooka return -1;
727 1.21 pooka }
728 1.21 pooka return (nn/sizeof(iev));
729 1.21 pooka }
730 1.26 pooka
731 1.26 pooka #else
732 1.26 pooka
/*
 * Fallback for hosts without a file-change notification facility.
 *
 * Nothing is registered; all arguments are ignored.  The first call
 * prints a one-time warning to stderr.  Always returns 0.
 */
int
rumpuser_writewatchfile_setup(int inotify, int fd, intptr_t notused, int *error)
{
	static int warned;

	if (warned == 0) {
		fprintf(stderr, "WARNING: rumpuser writewatchfile routines are "
		    "polling-only on this platform\n");
		warned = 1;
	}

	return 0;
}
747 1.26 pooka
/*
 * Fallback "wait": sleep for 10000 microseconds via usleep(3) and
 * return 0, leaving it to the caller to poll.  All arguments are
 * ignored.
 */
int
rumpuser_writewatchfile_wait(int kq, intptr_t *opaque, int *error)
{

	KLOCK_WRAP(usleep(10000));

	return 0;
}
755 1.18 pooka #endif
756 1.1 pooka
/*
 * This is meant for safe debugging prints from the kernel.
 *
 * Formats printf(3)-style onto stderr and returns the vfprintf(3)
 * result.
 */
int
rumpuser_dprintf(const char *format, ...)
{
	va_list args;
	int nprinted;

	va_start(args, format);
	nprinted = vfprintf(stderr, format, args);
	va_end(args);

	return nprinted;
}
772 1.2 pooka
/*
 * Deliver signal `sig' to host process `pid'; RUMPUSER_PID_SELF means
 * the calling process and is delivered with raise(3).
 *
 * Implemented on NetBSD only.  Elsewhere the call fails with -1 and
 * EOPNOTSUPP reported via seterror().
 *
 * NOTE(review): DOCALL is defined outside this file; it evidently
 * supplies the return statement and presumably reports errno through
 * `error' -- confirm in rumpuser_int.h.
 */
int
rumpuser_kill(int64_t pid, int sig, int *error)
{

#ifdef __NetBSD__
	if (pid != RUMPUSER_PID_SELF) {
		DOCALL(int, kill((pid_t)pid, sig));
	} else {
		DOCALL(int, raise(sig));
	}
#else
	/* XXXfixme: signal numbers may not match on non-NetBSD */
	seterror(EOPNOTSUPP);
	return -1;
#endif
}
789 1.4 pooka
/*
 * Return the number of CPUs on the host, never less than 1.
 *
 * NetBSD/FreeBSD/DragonFly: the hw.ncpu sysctl.
 * Linux/Cygwin:             lines of /proc/cpuinfo starting with
 *                           "processor".
 * Solaris:                  sysconf(_SC_NPROCESSORS_ONLN).
 *
 * If the query fails, yields a nonsensical value, or the platform is
 * unknown, 1 is returned.
 */
int
rumpuser_getnhostcpu(void)
{
	int ncpu = 1;

#if defined(__NetBSD__) || defined(__FreeBSD__) || defined(__DragonFly__)
	size_t sz = sizeof(ncpu);

	if (sysctlbyname("hw.ncpu", &ncpu, &sz, NULL, 0) == -1 || ncpu < 1)
		ncpu = 1;
#elif defined(__linux__) || defined(__CYGWIN__)
	FILE *fp;
	char *line = NULL;
	size_t n = 0;

	/* If anyone knows a better way, I'm all ears */
	if ((fp = fopen("/proc/cpuinfo", "r")) != NULL) {
		ncpu = 0;
		while (getline(&line, &n, fp) != -1) {
			if (strncmp(line,
			    "processor", sizeof("processor")-1) == 0)
				ncpu++;
		}
		if (ncpu == 0)
			ncpu = 1;
		free(line);
		fclose(fp);
	}
#elif defined(__sun__)
	long nonline;

	/* XXX: this is just a rough estimate ... */
	nonline = sysconf(_SC_NPROCESSORS_ONLN);
	/* sysconf() returns -1 on failure; keep the default then */
	if (nonline >= 1)
		ncpu = (int)nonline;
#endif

	return ncpu;
}
824 1.16 tls
/*
 * Return a 32-bit random number obtained from arc4random().
 *
 * XXX: this hypercall needs a better name
 */
uint32_t
rumpuser_arc4random(void)
{
	uint32_t rnd;

	rnd = arc4random();
	return rnd;
}
832