Home | History | Annotate | Line # | Download | only in librumpuser
rumpuser.c revision 1.21
      1  1.21  pooka /*	$NetBSD: rumpuser.c,v 1.21 2012/10/10 11:15:57 pooka Exp $	*/
      2   1.1  pooka 
      3   1.1  pooka /*
      4   1.1  pooka  * Copyright (c) 2007-2010 Antti Kantee.  All Rights Reserved.
      5   1.1  pooka  *
      6   1.1  pooka  * Redistribution and use in source and binary forms, with or without
      7   1.1  pooka  * modification, are permitted provided that the following conditions
      8   1.1  pooka  * are met:
      9   1.1  pooka  * 1. Redistributions of source code must retain the above copyright
     10   1.1  pooka  *    notice, this list of conditions and the following disclaimer.
     11   1.1  pooka  * 2. Redistributions in binary form must reproduce the above copyright
     12   1.1  pooka  *    notice, this list of conditions and the following disclaimer in the
     13   1.1  pooka  *    documentation and/or other materials provided with the distribution.
     14   1.1  pooka  *
     15   1.1  pooka  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS
     16   1.1  pooka  * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
     17   1.1  pooka  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
     18   1.1  pooka  * DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
     19   1.1  pooka  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     20   1.1  pooka  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
     21   1.1  pooka  * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     22   1.1  pooka  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     23   1.1  pooka  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     24   1.1  pooka  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     25   1.1  pooka  * SUCH DAMAGE.
     26   1.1  pooka  */
     27   1.1  pooka 
     28  1.18  pooka #include "rumpuser_port.h"
     29  1.18  pooka 
     30   1.1  pooka #if !defined(lint)
     31  1.21  pooka __RCSID("$NetBSD: rumpuser.c,v 1.21 2012/10/10 11:15:57 pooka Exp $");
     32   1.1  pooka #endif /* !lint */
     33   1.1  pooka 
     34   1.1  pooka #include <sys/ioctl.h>
     35   1.1  pooka #include <sys/mman.h>
     36   1.1  pooka #include <sys/uio.h>
     37  1.18  pooka #include <sys/stat.h>
     38  1.18  pooka #include <sys/time.h>
     39   1.1  pooka 
     40   1.1  pooka #ifdef __NetBSD__
     41  1.15  pooka #include <sys/disk.h>
     42   1.1  pooka #include <sys/disklabel.h>
     43  1.15  pooka #include <sys/dkio.h>
     44   1.4  pooka #include <sys/sysctl.h>
     45  1.18  pooka #include <sys/event.h>
     46   1.1  pooka #endif
     47   1.1  pooka 
     48   1.1  pooka #include <assert.h>
     49   1.1  pooka #include <err.h>
     50   1.1  pooka #include <errno.h>
     51   1.1  pooka #include <fcntl.h>
     52   1.1  pooka #include <poll.h>
     53   1.2  pooka #include <signal.h>
     54   1.1  pooka #include <stdarg.h>
     55   1.1  pooka #include <stdint.h>
     56   1.1  pooka #include <stdio.h>
     57   1.1  pooka #include <stdlib.h>
     58   1.1  pooka #include <string.h>
     59   1.1  pooka #include <time.h>
     60   1.1  pooka #include <unistd.h>
     61   1.1  pooka 
     62   1.1  pooka #include <rump/rumpuser.h>
     63   1.1  pooka 
     64   1.1  pooka #include "rumpuser_int.h"
     65   1.1  pooka 
     66   1.1  pooka int
     67  1.17    abs rumpuser_getversion(void)
     68   1.8  pooka {
     69   1.8  pooka 
     70   1.8  pooka 	return RUMPUSER_VERSION;
     71   1.8  pooka }
     72   1.8  pooka 
     73   1.8  pooka int
     74   1.1  pooka rumpuser_getfileinfo(const char *path, uint64_t *sizep, int *ftp, int *error)
     75   1.1  pooka {
     76   1.1  pooka 	struct stat sb;
     77   1.1  pooka 	uint64_t size;
     78   1.1  pooka 	int needsdev = 0, rv = 0, ft;
     79  1.12  pooka 	int fd = -1;
     80   1.1  pooka 
     81   1.1  pooka 	if (stat(path, &sb) == -1) {
     82  1.10  pooka 		seterror(errno);
     83   1.1  pooka 		return -1;
     84   1.1  pooka 	}
     85   1.1  pooka 
     86   1.1  pooka 	switch (sb.st_mode & S_IFMT) {
     87   1.1  pooka 	case S_IFDIR:
     88   1.1  pooka 		ft = RUMPUSER_FT_DIR;
     89   1.1  pooka 		break;
     90   1.1  pooka 	case S_IFREG:
     91   1.1  pooka 		ft = RUMPUSER_FT_REG;
     92   1.1  pooka 		break;
     93   1.1  pooka 	case S_IFBLK:
     94   1.1  pooka 		ft = RUMPUSER_FT_BLK;
     95   1.1  pooka 		needsdev = 1;
     96   1.1  pooka 		break;
     97   1.1  pooka 	case S_IFCHR:
     98   1.1  pooka 		ft = RUMPUSER_FT_CHR;
     99   1.1  pooka 		needsdev = 1;
    100   1.1  pooka 		break;
    101   1.1  pooka 	default:
    102   1.1  pooka 		ft = RUMPUSER_FT_OTHER;
    103   1.1  pooka 		break;
    104   1.1  pooka 	}
    105   1.1  pooka 
    106   1.1  pooka 	if (!needsdev) {
    107   1.1  pooka 		size = sb.st_size;
    108   1.1  pooka 	} else if (sizep) {
    109   1.1  pooka 		/*
    110   1.1  pooka 		 * Welcome to the jungle.  Of course querying the kernel
    111   1.1  pooka 		 * for a device partition size is supposed to be far from
    112   1.1  pooka 		 * trivial.  On NetBSD we use ioctl.  On $other platform
    113   1.1  pooka 		 * we have a problem.  We try "the lseek trick" and just
    114   1.1  pooka 		 * fail if that fails.  Platform specific code can later
    115   1.1  pooka 		 * be written here if appropriate.
    116   1.1  pooka 		 *
    117   1.1  pooka 		 * On NetBSD we hope and pray that for block devices nobody
    118   1.1  pooka 		 * else is holding them open, because otherwise the kernel
    119   1.1  pooka 		 * will not permit us to open it.  Thankfully, this is
    120   1.1  pooka 		 * usually called only in bootstrap and then we can
    121   1.1  pooka 		 * forget about it.
    122   1.1  pooka 		 */
    123   1.1  pooka #ifndef __NetBSD__
    124   1.1  pooka 		off_t off;
    125   1.1  pooka 
    126   1.1  pooka 		fd = open(path, O_RDONLY);
    127   1.1  pooka 		if (fd == -1) {
    128  1.10  pooka 			seterror(errno);
    129   1.1  pooka 			rv = -1;
    130   1.1  pooka 			goto out;
    131   1.1  pooka 		}
    132   1.1  pooka 
    133   1.1  pooka 		off = lseek(fd, 0, SEEK_END);
    134   1.1  pooka 		if (off != 0) {
    135   1.1  pooka 			size = off;
    136   1.1  pooka 			goto out;
    137   1.1  pooka 		}
    138   1.1  pooka 		fprintf(stderr, "error: device size query not implemented on "
    139   1.1  pooka 		    "this platform\n");
    140  1.12  pooka 		seterror(EOPNOTSUPP);
    141   1.1  pooka 		rv = -1;
    142   1.1  pooka 		goto out;
    143   1.1  pooka #else
    144   1.1  pooka 		struct disklabel lab;
    145   1.1  pooka 		struct partition *parta;
    146  1.15  pooka 		struct dkwedge_info dkw;
    147   1.1  pooka 
    148   1.1  pooka 		fd = open(path, O_RDONLY);
    149   1.1  pooka 		if (fd == -1) {
    150  1.10  pooka 			seterror(errno);
    151   1.1  pooka 			rv = -1;
    152   1.1  pooka 			goto out;
    153   1.1  pooka 		}
    154   1.1  pooka 
    155  1.15  pooka 		if (ioctl(fd, DIOCGDINFO, &lab) == 0) {
    156  1.15  pooka 			parta = &lab.d_partitions[DISKPART(sb.st_rdev)];
    157  1.15  pooka 			size = (uint64_t)lab.d_secsize * parta->p_size;
    158  1.15  pooka 			goto out;
    159  1.15  pooka 		}
    160  1.15  pooka 
    161  1.15  pooka 		if (ioctl(fd, DIOCGWEDGEINFO, &dkw) == 0) {
    162  1.15  pooka 			/*
    163  1.15  pooka 			 * XXX: should use DIOCGDISKINFO to query
    164  1.15  pooka 			 * sector size, but that requires proplib,
    165  1.15  pooka 			 * so just don't bother for now.  it's nice
    166  1.15  pooka 			 * that something as difficult as figuring out
    167  1.15  pooka 			 * a partition's size has been made so easy.
    168  1.15  pooka 			 */
    169  1.15  pooka 			size = dkw.dkw_size << DEV_BSHIFT;
    170   1.1  pooka 			goto out;
    171   1.1  pooka 		}
    172   1.1  pooka 
    173  1.15  pooka 		seterror(errno);
    174  1.15  pooka 		rv = -1;
    175   1.1  pooka #endif /* __NetBSD__ */
    176   1.1  pooka 	}
    177   1.1  pooka 
    178   1.1  pooka  out:
    179   1.1  pooka 	if (rv == 0 && sizep)
    180   1.1  pooka 		*sizep = size;
    181   1.1  pooka 	if (rv == 0 && ftp)
    182   1.1  pooka 		*ftp = ft;
    183  1.12  pooka 	if (fd != -1)
    184  1.12  pooka 		close(fd);
    185   1.1  pooka 
    186   1.1  pooka 	return rv;
    187   1.1  pooka }
    188   1.1  pooka 
/*
 * Sleep for the interval given by *sec / *nsec.
 *
 * On return *sec / *nsec hold the time that was left to sleep: zero
 * unless nanosleep() itself filled in a remainder.  Returns the
 * nanosleep() result; on -1 the errno value is handed to seterror().
 */
int
rumpuser_nanosleep(uint64_t *sec, uint64_t *nsec, int *error)
{
	struct timespec rqt, rmt;
	int rv;

	/*LINTED*/
	rqt.tv_sec = *sec;
	/*LINTED*/
	rqt.tv_nsec = *nsec;

	/*
	 * nanosleep() is only required to store the remaining time when
	 * the sleep is interrupted, so start from "nothing remaining"
	 * instead of copying out uninitialized stack contents.
	 */
	rmt.tv_sec = 0;
	rmt.tv_nsec = 0;

	KLOCK_WRAP(rv = nanosleep(&rqt, &rmt));
	if (rv == -1)
		seterror(errno);

	*sec = rmt.tv_sec;
	*nsec = rmt.tv_nsec;

	return rv;
}
    209   1.1  pooka 
/*
 * Allocate "howmuch" bytes aligned to "alignment" bytes.  An alignment
 * of 0 selects pointer-size alignment.  Returns NULL if the allocation
 * fails; an alignment rejected by posix_memalign() is treated as a
 * programming error and aborts.
 */
void *
rumpuser_malloc(size_t howmuch, int alignment)
{
	void *ptr;
	int err;

	if (alignment == 0)
		alignment = sizeof(void *);

	err = posix_memalign(&ptr, (size_t)alignment, howmuch);
	if (__predict_false(err != 0)) {
		if (err != EINVAL)
			return NULL;

		printf("rumpuser_malloc: invalid alignment %d\n",
		    alignment);
		abort();
	}

	return ptr;
}
    231   1.1  pooka 
/*
 * Resize the allocation at "ptr" to "howmuch" bytes via the host
 * realloc() and return its result unchanged.
 */
void *
rumpuser_realloc(void *ptr, size_t howmuch)
{
	void *resized = realloc(ptr, howmuch);

	return resized;
}
    238   1.1  pooka 
/*
 * Release memory through the host free().
 */
void
rumpuser_free(void *ptr)
{

	free(ptr);
	return;
}
    245   1.1  pooka 
    246   1.1  pooka void *
    247   1.7  pooka rumpuser_anonmmap(void *prefaddr, size_t size, int alignbit,
    248   1.7  pooka 	int exec, int *error)
    249   1.1  pooka {
    250   1.1  pooka 	void *rv;
    251   1.1  pooka 	int prot;
    252   1.1  pooka 
    253  1.18  pooka #ifndef MAP_ALIGNED
    254  1.18  pooka #define MAP_ALIGNED(a) 0
    255  1.18  pooka 	if (alignbit)
    256  1.18  pooka 		fprintf(stderr, "rumpuser_anonmmap: warning, requested "
    257  1.18  pooka 		    "alignment not supported by hypervisor\n");
    258  1.18  pooka #endif
    259  1.18  pooka 
    260   1.1  pooka 	prot = PROT_READ|PROT_WRITE;
    261   1.1  pooka 	if (exec)
    262   1.1  pooka 		prot |= PROT_EXEC;
    263   1.7  pooka 	rv = mmap(prefaddr, size, prot,
    264   1.7  pooka 	    MAP_ANON | MAP_ALIGNED(alignbit), -1, 0);
    265   1.1  pooka 	if (rv == MAP_FAILED) {
    266  1.10  pooka 		seterror(errno);
    267   1.1  pooka 		return NULL;
    268   1.1  pooka 	}
    269   1.1  pooka 	return rv;
    270   1.1  pooka }
    271   1.1  pooka 
/*
 * Remove the mapping of "len" bytes at "addr".  A munmap() failure is
 * caught by assert().
 */
void
rumpuser_unmap(void *addr, size_t len)
{
	int unmap_rv = munmap(addr, len);

	assert(unmap_rv == 0);
}
    280   1.1  pooka 
    281   1.1  pooka void *
    282   1.1  pooka rumpuser_filemmap(int fd, off_t offset, size_t len, int flags, int *error)
    283   1.1  pooka {
    284   1.1  pooka 	void *rv;
    285   1.1  pooka 	int mmflags, prot;
    286   1.1  pooka 
    287   1.1  pooka 	if (flags & RUMPUSER_FILEMMAP_TRUNCATE)
    288   1.1  pooka 		ftruncate(fd, offset + len);
    289   1.1  pooka 
    290   1.1  pooka 	mmflags = MAP_FILE;
    291   1.1  pooka 	if (flags & RUMPUSER_FILEMMAP_SHARED)
    292   1.1  pooka 		mmflags |= MAP_SHARED;
    293   1.1  pooka 	else
    294   1.1  pooka 		mmflags |= MAP_PRIVATE;
    295   1.1  pooka 
    296   1.1  pooka 	prot = 0;
    297   1.1  pooka 	if (flags & RUMPUSER_FILEMMAP_READ)
    298   1.1  pooka 		prot |= PROT_READ;
    299   1.1  pooka 	if (flags & RUMPUSER_FILEMMAP_WRITE)
    300   1.1  pooka 		prot |= PROT_WRITE;
    301   1.1  pooka 
    302   1.1  pooka 	rv = mmap(NULL, len, PROT_READ|PROT_WRITE, mmflags, fd, offset);
    303   1.1  pooka 	if (rv == MAP_FAILED) {
    304  1.10  pooka 		seterror(errno);
    305   1.1  pooka 		return NULL;
    306   1.1  pooka 	}
    307   1.1  pooka 
    308  1.10  pooka 	seterror(0);
    309   1.1  pooka 	return rv;
    310   1.1  pooka }
    311   1.1  pooka 
    312   1.1  pooka int
    313   1.1  pooka rumpuser_memsync(void *addr, size_t len, int *error)
    314   1.1  pooka {
    315   1.1  pooka 
    316   1.1  pooka 	DOCALL_KLOCK(int, (msync(addr, len, MS_SYNC)));
    317   1.1  pooka }
    318   1.1  pooka 
    319   1.1  pooka int
    320  1.20  pooka rumpuser_open(const char *path, int ruflags, int *error)
    321   1.1  pooka {
    322  1.20  pooka 	int flags;
    323   1.1  pooka 
    324  1.20  pooka 	switch (ruflags & RUMPUSER_OPEN_ACCMODE) {
    325  1.20  pooka 	case RUMPUSER_OPEN_RDONLY:
    326  1.20  pooka 		flags = O_RDONLY;
    327  1.20  pooka 		break;
    328  1.20  pooka 	case RUMPUSER_OPEN_WRONLY:
    329  1.20  pooka 		flags = O_WRONLY;
    330  1.20  pooka 		break;
    331  1.20  pooka 	case RUMPUSER_OPEN_RDWR:
    332  1.20  pooka 		flags = O_RDWR;
    333  1.20  pooka 		break;
    334  1.20  pooka 	default:
    335  1.20  pooka 		*error = EINVAL;
    336  1.20  pooka 		return -1;
    337  1.20  pooka 	}
    338  1.20  pooka 
    339  1.20  pooka #define TESTSET(_ru_, _h_) if (ruflags & _ru_) flags |= _h_;
    340  1.20  pooka 	TESTSET(RUMPUSER_OPEN_CREATE, O_CREAT);
    341  1.20  pooka 	TESTSET(RUMPUSER_OPEN_EXCL, O_EXCL);
    342  1.20  pooka 	TESTSET(RUMPUSER_OPEN_DIRECT, O_DIRECT);
    343  1.20  pooka #undef TESTSET
    344  1.20  pooka 
    345  1.20  pooka 	DOCALL_KLOCK(int, (open(path, flags, 0644)));
    346   1.1  pooka }
    347   1.1  pooka 
    348   1.1  pooka int
    349   1.1  pooka rumpuser_ioctl(int fd, u_long cmd, void *data, int *error)
    350   1.1  pooka {
    351   1.1  pooka 
    352   1.1  pooka 	DOCALL_KLOCK(int, (ioctl(fd, cmd, data)));
    353   1.1  pooka }
    354   1.1  pooka 
    355   1.1  pooka int
    356   1.1  pooka rumpuser_close(int fd, int *error)
    357   1.1  pooka {
    358   1.1  pooka 
    359   1.1  pooka 	DOCALL(int, close(fd));
    360   1.1  pooka }
    361   1.1  pooka 
    362   1.1  pooka int
    363   1.1  pooka rumpuser_fsync(int fd, int *error)
    364   1.1  pooka {
    365   1.1  pooka 
    366   1.1  pooka 	DOCALL_KLOCK(int, fsync(fd));
    367   1.1  pooka }
    368   1.1  pooka 
/*
 * Read up to "size" bytes from "fd" into "data".  The read() call is
 * wrapped in KLOCK_WRAP (defined outside this file).  Returns the
 * read() result; on -1 the errno value is handed to seterror().
 */
ssize_t
rumpuser_read(int fd, void *data, size_t size, int *error)
{
	ssize_t nread;

	KLOCK_WRAP(nread = read(fd, data, size));
	if (nread != -1)
		return nread;

	seterror(errno);
	return nread;
}
    380   1.1  pooka 
/*
 * Read up to "size" bytes from "fd" at file position "offset" into
 * "data".  The pread() call is wrapped in KLOCK_WRAP (defined outside
 * this file).  Returns the pread() result; on -1 the errno value is
 * handed to seterror().
 */
ssize_t
rumpuser_pread(int fd, void *data, size_t size, off_t offset, int *error)
{
	ssize_t nread;

	KLOCK_WRAP(nread = pread(fd, data, size, offset));
	if (nread != -1)
		return nread;

	seterror(errno);
	return nread;
}
    392   1.1  pooka 
    393   1.1  pooka void
    394   1.1  pooka rumpuser_read_bio(int fd, void *data, size_t size, off_t offset,
    395   1.1  pooka 	rump_biodone_fn biodone, void *biodonecookie)
    396   1.1  pooka {
    397   1.1  pooka 	ssize_t rv;
    398   1.1  pooka 	int error = 0;
    399   1.1  pooka 
    400   1.1  pooka 	rv = rumpuser_pread(fd, data, size, offset, &error);
    401   1.1  pooka 	/* check against <0 instead of ==-1 to get typing below right */
    402   1.1  pooka 	if (rv < 0)
    403   1.1  pooka 		rv = 0;
    404   1.1  pooka 
    405   1.1  pooka 	/* LINTED: see above */
    406   1.1  pooka 	biodone(biodonecookie, rv, error);
    407   1.1  pooka }
    408   1.1  pooka 
/*
 * Write up to "size" bytes from "data" to "fd".  The write() call is
 * wrapped in KLOCK_WRAP (defined outside this file).  Returns the
 * write() result; on -1 the errno value is handed to seterror().
 */
ssize_t
rumpuser_write(int fd, const void *data, size_t size, int *error)
{
	ssize_t nwritten;

	KLOCK_WRAP(nwritten = write(fd, data, size));
	if (nwritten != -1)
		return nwritten;

	seterror(errno);
	return nwritten;
}
    420   1.1  pooka 
/*
 * Write up to "size" bytes from "data" to "fd" at file position
 * "offset".  The pwrite() call is wrapped in KLOCK_WRAP (defined
 * outside this file).  Returns the pwrite() result; on -1 the errno
 * value is handed to seterror().
 */
ssize_t
rumpuser_pwrite(int fd, const void *data, size_t size, off_t offset, int *error)
{
	ssize_t nwritten;

	KLOCK_WRAP(nwritten = pwrite(fd, data, size, offset));
	if (nwritten != -1)
		return nwritten;

	seterror(errno);
	return nwritten;
}
    432   1.1  pooka 
    433   1.1  pooka void
    434   1.1  pooka rumpuser_write_bio(int fd, const void *data, size_t size, off_t offset,
    435   1.1  pooka 	rump_biodone_fn biodone, void *biodonecookie)
    436   1.1  pooka {
    437   1.1  pooka 	ssize_t rv;
    438   1.1  pooka 	int error = 0;
    439   1.1  pooka 
    440   1.1  pooka 	rv = rumpuser_pwrite(fd, data, size, offset, &error);
    441   1.1  pooka 	/* check against <0 instead of ==-1 to get typing below right */
    442   1.1  pooka 	if (rv < 0)
    443   1.1  pooka 		rv = 0;
    444   1.1  pooka 
    445   1.1  pooka 	/* LINTED: see above */
    446   1.1  pooka 	biodone(biodonecookie, rv, error);
    447   1.1  pooka }
    448   1.1  pooka 
    449   1.1  pooka ssize_t
    450   1.1  pooka rumpuser_readv(int fd, const struct rumpuser_iovec *riov, int iovcnt,
    451   1.1  pooka 	int *error)
    452   1.1  pooka {
    453   1.1  pooka 	struct iovec *iovp;
    454   1.1  pooka 	ssize_t rv;
    455   1.1  pooka 	int i;
    456   1.1  pooka 
    457   1.1  pooka 	iovp = malloc(iovcnt * sizeof(struct iovec));
    458   1.1  pooka 	if (iovp == NULL) {
    459  1.10  pooka 		seterror(ENOMEM);
    460   1.1  pooka 		return -1;
    461   1.1  pooka 	}
    462   1.1  pooka 	for (i = 0; i < iovcnt; i++) {
    463   1.1  pooka 		iovp[i].iov_base = riov[i].iov_base;
    464   1.1  pooka 		/*LINTED*/
    465   1.1  pooka 		iovp[i].iov_len = riov[i].iov_len;
    466   1.1  pooka 	}
    467   1.1  pooka 
    468   1.1  pooka 	KLOCK_WRAP(rv = readv(fd, iovp, iovcnt));
    469   1.1  pooka 	if (rv == -1)
    470  1.10  pooka 		seterror(errno);
    471   1.1  pooka 	free(iovp);
    472   1.1  pooka 
    473   1.1  pooka 	return rv;
    474   1.1  pooka }
    475   1.1  pooka 
    476   1.1  pooka ssize_t
    477   1.1  pooka rumpuser_writev(int fd, const struct rumpuser_iovec *riov, int iovcnt,
    478   1.1  pooka 	int *error)
    479   1.1  pooka {
    480   1.1  pooka 	struct iovec *iovp;
    481   1.1  pooka 	ssize_t rv;
    482   1.1  pooka 	int i;
    483   1.1  pooka 
    484   1.1  pooka 	iovp = malloc(iovcnt * sizeof(struct iovec));
    485   1.1  pooka 	if (iovp == NULL) {
    486  1.10  pooka 		seterror(ENOMEM);
    487   1.1  pooka 		return -1;
    488   1.1  pooka 	}
    489   1.1  pooka 	for (i = 0; i < iovcnt; i++) {
    490   1.1  pooka 		iovp[i].iov_base = riov[i].iov_base;
    491   1.1  pooka 		/*LINTED*/
    492   1.1  pooka 		iovp[i].iov_len = riov[i].iov_len;
    493   1.1  pooka 	}
    494   1.1  pooka 
    495   1.1  pooka 	KLOCK_WRAP(rv = writev(fd, iovp, iovcnt));
    496   1.1  pooka 	if (rv == -1)
    497  1.10  pooka 		seterror(errno);
    498   1.1  pooka 	free(iovp);
    499   1.1  pooka 
    500   1.1  pooka 	return rv;
    501   1.1  pooka }
    502   1.1  pooka 
    503   1.1  pooka int
    504   1.1  pooka rumpuser_gettime(uint64_t *sec, uint64_t *nsec, int *error)
    505   1.1  pooka {
    506   1.1  pooka 	struct timeval tv;
    507   1.1  pooka 	int rv;
    508   1.1  pooka 
    509   1.1  pooka 	rv = gettimeofday(&tv, NULL);
    510   1.1  pooka 	if (rv == -1) {
    511  1.10  pooka 		seterror(errno);
    512   1.1  pooka 		return rv;
    513   1.1  pooka 	}
    514   1.1  pooka 
    515   1.1  pooka 	*sec = tv.tv_sec;
    516   1.1  pooka 	*nsec = tv.tv_usec * 1000;
    517   1.1  pooka 
    518   1.1  pooka 	return 0;
    519   1.1  pooka }
    520   1.1  pooka 
    521   1.1  pooka int
    522   1.1  pooka rumpuser_getenv(const char *name, char *buf, size_t blen, int *error)
    523   1.1  pooka {
    524   1.1  pooka 
    525   1.1  pooka 	DOCALL(int, getenv_r(name, buf, blen));
    526   1.1  pooka }
    527   1.1  pooka 
/*
 * Build a host name for this rump instance in "name" ("namelen"
 * bytes): "rump-<pid>.<hostname>.rumpdomain", or
 * "rump-<pid>.rumpdomain" if the host name cannot be determined.
 * Always succeeds: sets *error to 0 and returns 0.
 */
int
rumpuser_gethostname(char *name, size_t namelen, int *error)
{
	char hostbuf[MAXHOSTNAMELEN];

	if (gethostname(hostbuf, sizeof(hostbuf)) != -1) {
		snprintf(name, namelen, "rump-%05d.%s.rumpdomain",
		    getpid(), hostbuf);
	} else {
		snprintf(name, namelen, "rump-%05d.rumpdomain", getpid());
	}

	*error = 0;
	return 0;
}
    543   1.1  pooka 
    544   1.1  pooka int
    545   1.1  pooka rumpuser_poll(struct pollfd *fds, int nfds, int timeout, int *error)
    546   1.1  pooka {
    547   1.1  pooka 
    548   1.1  pooka 	DOCALL_KLOCK(int, (poll(fds, (nfds_t)nfds, timeout)));
    549   1.1  pooka }
    550   1.1  pooka 
    551   1.1  pooka int
    552   1.1  pooka rumpuser_putchar(int c, int *error)
    553   1.1  pooka {
    554   1.1  pooka 
    555   1.1  pooka 	DOCALL(int, (putchar(c)));
    556   1.1  pooka }
    557   1.1  pooka 
    558   1.1  pooka void
    559   1.1  pooka rumpuser_exit(int rv)
    560   1.1  pooka {
    561   1.1  pooka 
    562   1.1  pooka 	if (rv == RUMPUSER_PANIC)
    563   1.1  pooka 		abort();
    564   1.1  pooka 	else
    565   1.1  pooka 		exit(rv);
    566   1.1  pooka }
    567   1.1  pooka 
/*
 * Set the host errno to "error".
 */
void
rumpuser_seterrno(int error)
{
	const int value = error;

	errno = value;
}
    574   1.1  pooka 
    575  1.21  pooka /*
    576  1.21  pooka  * On NetBSD we use kqueue, on Linux we use inotify.  The underlying
    577  1.21  pooka  * interface requirements aren't quite the same, but we have a very
    578  1.21  pooka  * good chance of doing the fd->path mapping on Linux thanks to dcache,
    579  1.21  pooka  * so just keep the existing interfaces for now.
    580  1.21  pooka  */
    581  1.21  pooka #if defined(__NetBSD__)
    582   1.1  pooka int
    583   1.1  pooka rumpuser_writewatchfile_setup(int kq, int fd, intptr_t opaque, int *error)
    584   1.1  pooka {
    585   1.1  pooka 	struct kevent kev;
    586   1.1  pooka 
    587   1.1  pooka 	if (kq == -1) {
    588   1.1  pooka 		kq = kqueue();
    589   1.1  pooka 		if (kq == -1) {
    590  1.10  pooka 			seterror(errno);
    591   1.1  pooka 			return -1;
    592   1.1  pooka 		}
    593   1.1  pooka 	}
    594   1.1  pooka 
    595   1.1  pooka 	EV_SET(&kev, fd, EVFILT_VNODE, EV_ADD|EV_ENABLE|EV_CLEAR,
    596   1.1  pooka 	    NOTE_WRITE, 0, opaque);
    597   1.1  pooka 	if (kevent(kq, &kev, 1, NULL, 0, NULL) == -1) {
    598  1.10  pooka 		seterror(errno);
    599   1.1  pooka 		return -1;
    600   1.1  pooka 	}
    601   1.1  pooka 
    602   1.1  pooka 	return kq;
    603   1.1  pooka }
    604   1.1  pooka 
    605   1.1  pooka int
    606   1.1  pooka rumpuser_writewatchfile_wait(int kq, intptr_t *opaque, int *error)
    607   1.1  pooka {
    608   1.1  pooka 	struct kevent kev;
    609   1.1  pooka 	int rv;
    610   1.1  pooka 
    611   1.9  pooka  again:
    612   1.1  pooka 	KLOCK_WRAP(rv = kevent(kq, NULL, 0, &kev, 1, NULL));
    613   1.1  pooka 	if (rv == -1) {
    614   1.9  pooka 		if (errno == EINTR)
    615   1.9  pooka 			goto again;
    616  1.10  pooka 		seterror(errno);
    617   1.1  pooka 		return -1;
    618   1.1  pooka 	}
    619   1.1  pooka 
    620   1.1  pooka 	if (opaque)
    621   1.1  pooka 		*opaque = kev.udata;
    622   1.1  pooka 	return rv;
    623   1.1  pooka }
    624  1.21  pooka 
    625  1.21  pooka #elif defined(__linux__)
    626  1.21  pooka #include <sys/inotify.h>
    627  1.21  pooka 
    628  1.21  pooka int
    629  1.21  pooka rumpuser_writewatchfile_setup(int inotify, int fd, intptr_t notused, int *error)
    630  1.21  pooka {
    631  1.21  pooka 	char procbuf[PATH_MAX], linkbuf[PATH_MAX];
    632  1.21  pooka 	ssize_t nn;
    633  1.21  pooka 
    634  1.21  pooka 	if (inotify == -1) {
    635  1.21  pooka 		inotify = inotify_init();
    636  1.21  pooka 		if (inotify == -1) {
    637  1.21  pooka 			seterror(errno);
    638  1.21  pooka 			return -1;
    639  1.21  pooka 		}
    640  1.21  pooka 	}
    641  1.21  pooka 
    642  1.21  pooka 	/* ok, need to map fd into path for inotify */
    643  1.21  pooka 	snprintf(procbuf, sizeof(procbuf), "/proc/self/fd/%d", fd);
    644  1.21  pooka 	nn = readlink(procbuf, linkbuf, sizeof(linkbuf));
    645  1.21  pooka 	if (nn >= (ssize_t)sizeof(linkbuf)) {
    646  1.21  pooka 		nn = -1;
    647  1.21  pooka 		errno = E2BIG; /* pick something */
    648  1.21  pooka 	}
    649  1.21  pooka 	if (nn == -1) {
    650  1.21  pooka 		seterror(errno);
    651  1.21  pooka 		close(inotify);
    652  1.21  pooka 		return -1;
    653  1.21  pooka 	}
    654  1.21  pooka 
    655  1.21  pooka 	if (inotify_add_watch(inotify, linkbuf, IN_MODIFY) == -1) {
    656  1.21  pooka 		seterror(errno);
    657  1.21  pooka 		close(inotify);
    658  1.21  pooka 		return -1;
    659  1.21  pooka 	}
    660  1.21  pooka 
    661  1.21  pooka 	return inotify;
    662  1.21  pooka }
    663  1.21  pooka 
    664  1.21  pooka int
    665  1.21  pooka rumpuser_writewatchfile_wait(int kq, intptr_t *opaque, int *error)
    666  1.21  pooka {
    667  1.21  pooka 	struct inotify_event iev;
    668  1.21  pooka 	ssize_t nn;
    669  1.21  pooka 
    670  1.21  pooka 	do {
    671  1.21  pooka 		KLOCK_WRAP(nn = read(kq, &iev, sizeof(iev)));
    672  1.21  pooka 	} while (errno == EINTR);
    673  1.21  pooka 
    674  1.21  pooka 	if (nn == -1) {
    675  1.21  pooka 		seterror(errno);
    676  1.21  pooka 		return -1;
    677  1.21  pooka 	}
    678  1.21  pooka 	return (nn/sizeof(iev));
    679  1.21  pooka }
    680  1.18  pooka #endif
    681   1.1  pooka 
/*
 * This is meant for safe debugging prints from the kernel.
 * Formats like printf() onto the host's stderr and returns the
 * vfprintf() result.
 */
int
rumpuser_dprintf(const char *format, ...)
{
	va_list args;
	int nprinted;

	va_start(args, format);
	nprinted = vfprintf(stderr, format, args);
	va_end(args);

	return nprinted;
}
    697   1.2  pooka 
/*
 * Deliver signal "sig" to host process "pid"; RUMPUSER_PID_SELF
 * targets the calling process via raise().
 *
 * Only implemented on NetBSD.  Elsewhere the call fails with -1 and
 * EOPNOTSUPP handed to seterror().  On NetBSD result and error
 * reporting are handled by DOCALL, which is defined outside this file.
 */
int
rumpuser_kill(int64_t pid, int sig, int *error)
{

#ifndef __NetBSD__
	/* XXXfixme: signal numbers may not match on non-NetBSD */
	seterror(EOPNOTSUPP);
	return -1;
#else
	if (pid == RUMPUSER_PID_SELF) {
		DOCALL(int, raise(sig));
	} else {
		DOCALL(int, kill((pid_t)pid, sig));
	}
#endif
}
    714   1.4  pooka 
/*
 * Return the number of CPUs on the host.  NetBSD asks the hw.ncpu
 * sysctl; Linux counts the lines in /proc/cpuinfo that start with
 * "processor".  The answer defaults to 1 when nothing better is
 * available.
 */
int
rumpuser_getnhostcpu(void)
{
	int ncpu = 1;

#ifdef __NetBSD__
	size_t sz = sizeof(ncpu);

	sysctlbyname("hw.ncpu", &ncpu, &sz, NULL, 0);
#elif __linux__
	static const char key[] = "processor";
	FILE *cpuinfo;
	char *buf = NULL;
	size_t cap = 0;

	/* If anyone knows a better way, I'm all ears */
	cpuinfo = fopen("/proc/cpuinfo", "r");
	if (cpuinfo != NULL) {
		int found = 0;

		while (getline(&buf, &cap, cpuinfo) != -1) {
			if (strncmp(buf, key, sizeof(key) - 1) == 0)
				found++;
		}
		ncpu = (found != 0) ? found : 1;
		free(buf);
		fclose(cpuinfo);
	}
#endif

	return ncpu;
}
    746  1.16    tls 
/*
 * Return a 32-bit value from the host's arc4random().
 *
 * XXX: this hypercall needs a better name
 */
uint32_t
rumpuser_arc4random(void)
{
	uint32_t value = arc4random();

	return value;
}
    754