Home | History | Annotate | Line # | Download | only in librumpuser
rumpuser.c revision 1.30
      1  1.30  pooka /*	$NetBSD: rumpuser.c,v 1.30 2013/04/27 14:59:08 pooka Exp $	*/
      2   1.1  pooka 
      3   1.1  pooka /*
      4   1.1  pooka  * Copyright (c) 2007-2010 Antti Kantee.  All Rights Reserved.
      5   1.1  pooka  *
      6   1.1  pooka  * Redistribution and use in source and binary forms, with or without
      7   1.1  pooka  * modification, are permitted provided that the following conditions
      8   1.1  pooka  * are met:
      9   1.1  pooka  * 1. Redistributions of source code must retain the above copyright
     10   1.1  pooka  *    notice, this list of conditions and the following disclaimer.
     11   1.1  pooka  * 2. Redistributions in binary form must reproduce the above copyright
     12   1.1  pooka  *    notice, this list of conditions and the following disclaimer in the
     13   1.1  pooka  *    documentation and/or other materials provided with the distribution.
     14   1.1  pooka  *
     15   1.1  pooka  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS
     16   1.1  pooka  * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
     17   1.1  pooka  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
     18   1.1  pooka  * DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
     19   1.1  pooka  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     20   1.1  pooka  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
     21   1.1  pooka  * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     22   1.1  pooka  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     23   1.1  pooka  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     24   1.1  pooka  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     25   1.1  pooka  * SUCH DAMAGE.
     26   1.1  pooka  */
     27   1.1  pooka 
     28  1.18  pooka #include "rumpuser_port.h"
     29  1.18  pooka 
     30   1.1  pooka #if !defined(lint)
     31  1.30  pooka __RCSID("$NetBSD: rumpuser.c,v 1.30 2013/04/27 14:59:08 pooka Exp $");
     32   1.1  pooka #endif /* !lint */
     33   1.1  pooka 
     34   1.1  pooka #include <sys/ioctl.h>
     35   1.1  pooka #include <sys/mman.h>
     36   1.1  pooka #include <sys/uio.h>
     37  1.18  pooka #include <sys/stat.h>
     38  1.18  pooka #include <sys/time.h>
     39   1.1  pooka 
     40   1.1  pooka #ifdef __NetBSD__
     41  1.15  pooka #include <sys/disk.h>
     42   1.1  pooka #include <sys/disklabel.h>
     43  1.15  pooka #include <sys/dkio.h>
     44  1.25  pooka #include <sys/event.h>
     45  1.25  pooka #endif
     46  1.25  pooka 
     47  1.25  pooka #if defined(__NetBSD__) || defined(__FreeBSD__) || defined(__DragonFly__)
     48   1.4  pooka #include <sys/sysctl.h>
     49   1.1  pooka #endif
     50   1.1  pooka 
     51   1.1  pooka #include <assert.h>
     52   1.1  pooka #include <errno.h>
     53   1.1  pooka #include <fcntl.h>
     54  1.23  pooka #include <netdb.h>
     55   1.1  pooka #include <poll.h>
     56   1.2  pooka #include <signal.h>
     57   1.1  pooka #include <stdarg.h>
     58   1.1  pooka #include <stdint.h>
     59   1.1  pooka #include <stdio.h>
     60   1.1  pooka #include <stdlib.h>
     61   1.1  pooka #include <string.h>
     62   1.1  pooka #include <time.h>
     63   1.1  pooka #include <unistd.h>
     64   1.1  pooka 
     65   1.1  pooka #include <rump/rumpuser.h>
     66   1.1  pooka 
     67   1.1  pooka #include "rumpuser_int.h"
     68   1.1  pooka 
     69  1.30  pooka rump_unschedulefn	rumpuser__unschedule;
     70  1.30  pooka rump_reschedulefn	rumpuser__reschedule;
     71  1.30  pooka 
     72   1.1  pooka int
     73  1.30  pooka rumpuser_init(int version,
     74  1.30  pooka 	rump_reschedulefn rumpkern_resched, rump_unschedulefn rumpkern_unsched)
     75   1.8  pooka {
     76   1.8  pooka 
     77  1.30  pooka 	if (version != RUMPUSER_VERSION) {
     78  1.30  pooka 		fprintf(stderr, "rumpuser mismatch, kern: %d, hypervisor %d\n",
     79  1.30  pooka 		    version, RUMPUSER_VERSION);
     80  1.30  pooka 		return 1;
     81  1.30  pooka 	}
     82  1.30  pooka 
     83  1.30  pooka #ifdef RUMPUSER_USE_RANDOM
     84  1.30  pooka 	uint32_t rv;
     85  1.30  pooka 	int fd;
     86  1.30  pooka 
     87  1.30  pooka 	if ((fd = open("/dev/urandom", O_RDONLY)) == -1) {
     88  1.30  pooka 		srandom(time(NULL));
     89  1.30  pooka 	} else {
     90  1.30  pooka 		if (read(fd, &rv, sizeof(rv)) != sizeof(rv))
     91  1.30  pooka 			srandom(time(NULL));
     92  1.30  pooka 		else
     93  1.30  pooka 			srandom(rv);
     94  1.30  pooka 		close(fd);
     95  1.30  pooka 	}
     96  1.30  pooka #endif
     97  1.30  pooka 
     98  1.30  pooka 	rumpuser__thrinit();
     99  1.30  pooka 
    100  1.30  pooka 	rumpuser__unschedule = rumpkern_unsched;
    101  1.30  pooka 	rumpuser__reschedule = rumpkern_resched;
    102  1.30  pooka 
    103  1.30  pooka 	return 0;
    104   1.8  pooka }
    105   1.8  pooka 
    106   1.8  pooka int
    107   1.1  pooka rumpuser_getfileinfo(const char *path, uint64_t *sizep, int *ftp, int *error)
    108   1.1  pooka {
    109   1.1  pooka 	struct stat sb;
    110   1.1  pooka 	uint64_t size;
    111   1.1  pooka 	int needsdev = 0, rv = 0, ft;
    112  1.12  pooka 	int fd = -1;
    113   1.1  pooka 
    114   1.1  pooka 	if (stat(path, &sb) == -1) {
    115  1.10  pooka 		seterror(errno);
    116   1.1  pooka 		return -1;
    117   1.1  pooka 	}
    118   1.1  pooka 
    119   1.1  pooka 	switch (sb.st_mode & S_IFMT) {
    120   1.1  pooka 	case S_IFDIR:
    121   1.1  pooka 		ft = RUMPUSER_FT_DIR;
    122   1.1  pooka 		break;
    123   1.1  pooka 	case S_IFREG:
    124   1.1  pooka 		ft = RUMPUSER_FT_REG;
    125   1.1  pooka 		break;
    126   1.1  pooka 	case S_IFBLK:
    127   1.1  pooka 		ft = RUMPUSER_FT_BLK;
    128   1.1  pooka 		needsdev = 1;
    129   1.1  pooka 		break;
    130   1.1  pooka 	case S_IFCHR:
    131   1.1  pooka 		ft = RUMPUSER_FT_CHR;
    132   1.1  pooka 		needsdev = 1;
    133   1.1  pooka 		break;
    134   1.1  pooka 	default:
    135   1.1  pooka 		ft = RUMPUSER_FT_OTHER;
    136   1.1  pooka 		break;
    137   1.1  pooka 	}
    138   1.1  pooka 
    139   1.1  pooka 	if (!needsdev) {
    140   1.1  pooka 		size = sb.st_size;
    141   1.1  pooka 	} else if (sizep) {
    142   1.1  pooka 		/*
    143   1.1  pooka 		 * Welcome to the jungle.  Of course querying the kernel
    144   1.1  pooka 		 * for a device partition size is supposed to be far from
    145   1.1  pooka 		 * trivial.  On NetBSD we use ioctl.  On $other platform
    146   1.1  pooka 		 * we have a problem.  We try "the lseek trick" and just
    147   1.1  pooka 		 * fail if that fails.  Platform specific code can later
    148   1.1  pooka 		 * be written here if appropriate.
    149   1.1  pooka 		 *
    150   1.1  pooka 		 * On NetBSD we hope and pray that for block devices nobody
    151   1.1  pooka 		 * else is holding them open, because otherwise the kernel
    152   1.1  pooka 		 * will not permit us to open it.  Thankfully, this is
    153   1.1  pooka 		 * usually called only in bootstrap and then we can
    154   1.1  pooka 		 * forget about it.
    155   1.1  pooka 		 */
    156   1.1  pooka #ifndef __NetBSD__
    157   1.1  pooka 		off_t off;
    158   1.1  pooka 
    159   1.1  pooka 		fd = open(path, O_RDONLY);
    160   1.1  pooka 		if (fd == -1) {
    161  1.10  pooka 			seterror(errno);
    162   1.1  pooka 			rv = -1;
    163   1.1  pooka 			goto out;
    164   1.1  pooka 		}
    165   1.1  pooka 
    166   1.1  pooka 		off = lseek(fd, 0, SEEK_END);
    167   1.1  pooka 		if (off != 0) {
    168   1.1  pooka 			size = off;
    169   1.1  pooka 			goto out;
    170   1.1  pooka 		}
    171   1.1  pooka 		fprintf(stderr, "error: device size query not implemented on "
    172   1.1  pooka 		    "this platform\n");
    173  1.12  pooka 		seterror(EOPNOTSUPP);
    174   1.1  pooka 		rv = -1;
    175   1.1  pooka 		goto out;
    176   1.1  pooka #else
    177   1.1  pooka 		struct disklabel lab;
    178   1.1  pooka 		struct partition *parta;
    179  1.15  pooka 		struct dkwedge_info dkw;
    180   1.1  pooka 
    181   1.1  pooka 		fd = open(path, O_RDONLY);
    182   1.1  pooka 		if (fd == -1) {
    183  1.10  pooka 			seterror(errno);
    184   1.1  pooka 			rv = -1;
    185   1.1  pooka 			goto out;
    186   1.1  pooka 		}
    187   1.1  pooka 
    188  1.15  pooka 		if (ioctl(fd, DIOCGDINFO, &lab) == 0) {
    189  1.15  pooka 			parta = &lab.d_partitions[DISKPART(sb.st_rdev)];
    190  1.15  pooka 			size = (uint64_t)lab.d_secsize * parta->p_size;
    191  1.15  pooka 			goto out;
    192  1.15  pooka 		}
    193  1.15  pooka 
    194  1.15  pooka 		if (ioctl(fd, DIOCGWEDGEINFO, &dkw) == 0) {
    195  1.15  pooka 			/*
    196  1.15  pooka 			 * XXX: should use DIOCGDISKINFO to query
    197  1.15  pooka 			 * sector size, but that requires proplib,
    198  1.15  pooka 			 * so just don't bother for now.  it's nice
    199  1.15  pooka 			 * that something as difficult as figuring out
    200  1.15  pooka 			 * a partition's size has been made so easy.
    201  1.15  pooka 			 */
    202  1.15  pooka 			size = dkw.dkw_size << DEV_BSHIFT;
    203   1.1  pooka 			goto out;
    204   1.1  pooka 		}
    205   1.1  pooka 
    206  1.15  pooka 		seterror(errno);
    207  1.15  pooka 		rv = -1;
    208   1.1  pooka #endif /* __NetBSD__ */
    209   1.1  pooka 	}
    210   1.1  pooka 
    211   1.1  pooka  out:
    212   1.1  pooka 	if (rv == 0 && sizep)
    213   1.1  pooka 		*sizep = size;
    214   1.1  pooka 	if (rv == 0 && ftp)
    215   1.1  pooka 		*ftp = ft;
    216  1.12  pooka 	if (fd != -1)
    217  1.12  pooka 		close(fd);
    218   1.1  pooka 
    219   1.1  pooka 	return rv;
    220   1.1  pooka }
    221   1.1  pooka 
    222   1.1  pooka int
    223   1.1  pooka rumpuser_nanosleep(uint64_t *sec, uint64_t *nsec, int *error)
    224   1.1  pooka {
    225   1.1  pooka 	struct timespec rqt, rmt;
    226   1.1  pooka 	int rv;
    227   1.1  pooka 
    228   1.1  pooka 	/*LINTED*/
    229   1.1  pooka 	rqt.tv_sec = *sec;
    230   1.1  pooka 	/*LINTED*/
    231   1.1  pooka 	rqt.tv_nsec = *nsec;
    232   1.1  pooka 
    233   1.1  pooka 	KLOCK_WRAP(rv = nanosleep(&rqt, &rmt));
    234   1.1  pooka 	if (rv == -1)
    235  1.10  pooka 		seterror(errno);
    236   1.1  pooka 
    237   1.1  pooka 	*sec = rmt.tv_sec;
    238   1.1  pooka 	*nsec = rmt.tv_nsec;
    239   1.1  pooka 
    240   1.1  pooka 	return rv;
    241   1.1  pooka }
    242   1.1  pooka 
    243   1.1  pooka void *
    244   1.5  pooka rumpuser_malloc(size_t howmuch, int alignment)
    245   1.1  pooka {
    246   1.5  pooka 	void *mem;
    247   1.6  pooka 	int rv;
    248   1.5  pooka 
    249   1.5  pooka 	if (alignment == 0)
    250   1.5  pooka 		alignment = sizeof(void *);
    251   1.1  pooka 
    252  1.14  pooka 	rv = posix_memalign(&mem, (size_t)alignment, howmuch);
    253   1.6  pooka 	if (__predict_false(rv != 0)) {
    254   1.6  pooka 		if (rv == EINVAL) {
    255   1.6  pooka 			printf("rumpuser_malloc: invalid alignment %d\n",
    256   1.6  pooka 			    alignment);
    257   1.6  pooka 			abort();
    258   1.6  pooka 		}
    259   1.6  pooka 		mem = NULL;
    260   1.6  pooka 	}
    261   1.1  pooka 
    262   1.5  pooka 	return mem;
    263   1.1  pooka }
    264   1.1  pooka 
    265   1.1  pooka void *
    266   1.5  pooka rumpuser_realloc(void *ptr, size_t howmuch)
    267   1.1  pooka {
    268   1.1  pooka 
    269   1.5  pooka 	return realloc(ptr, howmuch);
    270   1.1  pooka }
    271   1.1  pooka 
    272   1.1  pooka void
    273   1.1  pooka rumpuser_free(void *ptr)
    274   1.1  pooka {
    275   1.1  pooka 
    276   1.1  pooka 	free(ptr);
    277   1.1  pooka }
    278   1.1  pooka 
    279   1.1  pooka void *
    280   1.7  pooka rumpuser_anonmmap(void *prefaddr, size_t size, int alignbit,
    281   1.7  pooka 	int exec, int *error)
    282   1.1  pooka {
    283   1.1  pooka 	void *rv;
    284   1.1  pooka 	int prot;
    285   1.1  pooka 
    286  1.18  pooka #ifndef MAP_ALIGNED
    287  1.18  pooka #define MAP_ALIGNED(a) 0
    288  1.18  pooka 	if (alignbit)
    289  1.18  pooka 		fprintf(stderr, "rumpuser_anonmmap: warning, requested "
    290  1.18  pooka 		    "alignment not supported by hypervisor\n");
    291  1.18  pooka #endif
    292  1.18  pooka 
    293   1.1  pooka 	prot = PROT_READ|PROT_WRITE;
    294   1.1  pooka 	if (exec)
    295   1.1  pooka 		prot |= PROT_EXEC;
    296   1.7  pooka 	rv = mmap(prefaddr, size, prot,
    297  1.24  pooka 	    MAP_PRIVATE | MAP_ANON | MAP_ALIGNED(alignbit), -1, 0);
    298   1.1  pooka 	if (rv == MAP_FAILED) {
    299  1.10  pooka 		seterror(errno);
    300   1.1  pooka 		return NULL;
    301   1.1  pooka 	}
    302   1.1  pooka 	return rv;
    303   1.1  pooka }
    304   1.1  pooka 
    305   1.1  pooka void
    306   1.1  pooka rumpuser_unmap(void *addr, size_t len)
    307   1.1  pooka {
    308   1.1  pooka 	int rv;
    309   1.1  pooka 
    310   1.1  pooka 	rv = munmap(addr, len);
    311   1.1  pooka 	assert(rv == 0);
    312   1.1  pooka }
    313   1.1  pooka 
    314   1.1  pooka void *
    315   1.1  pooka rumpuser_filemmap(int fd, off_t offset, size_t len, int flags, int *error)
    316   1.1  pooka {
    317   1.1  pooka 	void *rv;
    318   1.1  pooka 	int mmflags, prot;
    319   1.1  pooka 
    320  1.22  pooka 	if (flags & RUMPUSER_FILEMMAP_TRUNCATE) {
    321  1.22  pooka 		if (ftruncate(fd, offset + len) == -1) {
    322  1.22  pooka 			seterror(errno);
    323  1.22  pooka 			return NULL;
    324  1.22  pooka 		}
    325  1.22  pooka 	}
    326   1.1  pooka 
    327  1.23  pooka /* it's implicit */
    328  1.23  pooka #if defined(__sun__) && !defined(MAP_FILE)
    329  1.23  pooka #define MAP_FILE 0
    330  1.23  pooka #endif
    331  1.23  pooka 
    332   1.1  pooka 	mmflags = MAP_FILE;
    333   1.1  pooka 	if (flags & RUMPUSER_FILEMMAP_SHARED)
    334   1.1  pooka 		mmflags |= MAP_SHARED;
    335   1.1  pooka 	else
    336   1.1  pooka 		mmflags |= MAP_PRIVATE;
    337   1.1  pooka 
    338   1.1  pooka 	prot = 0;
    339   1.1  pooka 	if (flags & RUMPUSER_FILEMMAP_READ)
    340   1.1  pooka 		prot |= PROT_READ;
    341   1.1  pooka 	if (flags & RUMPUSER_FILEMMAP_WRITE)
    342   1.1  pooka 		prot |= PROT_WRITE;
    343   1.1  pooka 
    344   1.1  pooka 	rv = mmap(NULL, len, PROT_READ|PROT_WRITE, mmflags, fd, offset);
    345   1.1  pooka 	if (rv == MAP_FAILED) {
    346  1.10  pooka 		seterror(errno);
    347   1.1  pooka 		return NULL;
    348   1.1  pooka 	}
    349   1.1  pooka 
    350  1.10  pooka 	seterror(0);
    351   1.1  pooka 	return rv;
    352   1.1  pooka }
    353   1.1  pooka 
    354   1.1  pooka int
    355   1.1  pooka rumpuser_memsync(void *addr, size_t len, int *error)
    356   1.1  pooka {
    357   1.1  pooka 
    358   1.1  pooka 	DOCALL_KLOCK(int, (msync(addr, len, MS_SYNC)));
    359   1.1  pooka }
    360   1.1  pooka 
    361   1.1  pooka int
    362  1.20  pooka rumpuser_open(const char *path, int ruflags, int *error)
    363   1.1  pooka {
    364  1.20  pooka 	int flags;
    365   1.1  pooka 
    366  1.20  pooka 	switch (ruflags & RUMPUSER_OPEN_ACCMODE) {
    367  1.20  pooka 	case RUMPUSER_OPEN_RDONLY:
    368  1.20  pooka 		flags = O_RDONLY;
    369  1.20  pooka 		break;
    370  1.20  pooka 	case RUMPUSER_OPEN_WRONLY:
    371  1.20  pooka 		flags = O_WRONLY;
    372  1.20  pooka 		break;
    373  1.20  pooka 	case RUMPUSER_OPEN_RDWR:
    374  1.20  pooka 		flags = O_RDWR;
    375  1.20  pooka 		break;
    376  1.20  pooka 	default:
    377  1.20  pooka 		*error = EINVAL;
    378  1.20  pooka 		return -1;
    379  1.20  pooka 	}
    380  1.20  pooka 
    381  1.20  pooka #define TESTSET(_ru_, _h_) if (ruflags & _ru_) flags |= _h_;
    382  1.20  pooka 	TESTSET(RUMPUSER_OPEN_CREATE, O_CREAT);
    383  1.20  pooka 	TESTSET(RUMPUSER_OPEN_EXCL, O_EXCL);
    384  1.23  pooka #ifdef O_DIRECT
    385  1.20  pooka 	TESTSET(RUMPUSER_OPEN_DIRECT, O_DIRECT);
    386  1.23  pooka #else
    387  1.23  pooka 	if (ruflags & RUMPUSER_OPEN_DIRECT) {
    388  1.23  pooka 		*error = EOPNOTSUPP;
    389  1.23  pooka 		return -1;
    390  1.23  pooka 	}
    391  1.23  pooka #endif
    392  1.20  pooka #undef TESTSET
    393  1.20  pooka 
    394  1.20  pooka 	DOCALL_KLOCK(int, (open(path, flags, 0644)));
    395   1.1  pooka }
    396   1.1  pooka 
    397   1.1  pooka int
    398   1.1  pooka rumpuser_ioctl(int fd, u_long cmd, void *data, int *error)
    399   1.1  pooka {
    400   1.1  pooka 
    401   1.1  pooka 	DOCALL_KLOCK(int, (ioctl(fd, cmd, data)));
    402   1.1  pooka }
    403   1.1  pooka 
    404   1.1  pooka int
    405   1.1  pooka rumpuser_close(int fd, int *error)
    406   1.1  pooka {
    407   1.1  pooka 
    408   1.1  pooka 	DOCALL(int, close(fd));
    409   1.1  pooka }
    410   1.1  pooka 
    411   1.1  pooka int
    412   1.1  pooka rumpuser_fsync(int fd, int *error)
    413   1.1  pooka {
    414   1.1  pooka 
    415   1.1  pooka 	DOCALL_KLOCK(int, fsync(fd));
    416   1.1  pooka }
    417   1.1  pooka 
    418   1.1  pooka ssize_t
    419   1.1  pooka rumpuser_read(int fd, void *data, size_t size, int *error)
    420   1.1  pooka {
    421   1.1  pooka 	ssize_t rv;
    422   1.1  pooka 
    423   1.1  pooka 	KLOCK_WRAP(rv = read(fd, data, size));
    424   1.1  pooka 	if (rv == -1)
    425  1.10  pooka 		seterror(errno);
    426   1.1  pooka 
    427   1.1  pooka 	return rv;
    428   1.1  pooka }
    429   1.1  pooka 
    430   1.1  pooka ssize_t
    431   1.1  pooka rumpuser_pread(int fd, void *data, size_t size, off_t offset, int *error)
    432   1.1  pooka {
    433   1.1  pooka 	ssize_t rv;
    434   1.1  pooka 
    435   1.1  pooka 	KLOCK_WRAP(rv = pread(fd, data, size, offset));
    436   1.1  pooka 	if (rv == -1)
    437  1.10  pooka 		seterror(errno);
    438   1.1  pooka 
    439   1.1  pooka 	return rv;
    440   1.1  pooka }
    441   1.1  pooka 
    442   1.1  pooka void
    443   1.1  pooka rumpuser_read_bio(int fd, void *data, size_t size, off_t offset,
    444   1.1  pooka 	rump_biodone_fn biodone, void *biodonecookie)
    445   1.1  pooka {
    446   1.1  pooka 	ssize_t rv;
    447   1.1  pooka 	int error = 0;
    448   1.1  pooka 
    449   1.1  pooka 	rv = rumpuser_pread(fd, data, size, offset, &error);
    450   1.1  pooka 	/* check against <0 instead of ==-1 to get typing below right */
    451   1.1  pooka 	if (rv < 0)
    452   1.1  pooka 		rv = 0;
    453   1.1  pooka 
    454   1.1  pooka 	/* LINTED: see above */
    455   1.1  pooka 	biodone(biodonecookie, rv, error);
    456   1.1  pooka }
    457   1.1  pooka 
    458   1.1  pooka ssize_t
    459   1.1  pooka rumpuser_write(int fd, const void *data, size_t size, int *error)
    460   1.1  pooka {
    461   1.1  pooka 	ssize_t rv;
    462   1.1  pooka 
    463   1.1  pooka 	KLOCK_WRAP(rv = write(fd, data, size));
    464   1.1  pooka 	if (rv == -1)
    465  1.10  pooka 		seterror(errno);
    466   1.1  pooka 
    467   1.1  pooka 	return rv;
    468   1.1  pooka }
    469   1.1  pooka 
    470   1.1  pooka ssize_t
    471   1.1  pooka rumpuser_pwrite(int fd, const void *data, size_t size, off_t offset, int *error)
    472   1.1  pooka {
    473   1.1  pooka 	ssize_t rv;
    474   1.1  pooka 
    475   1.1  pooka 	KLOCK_WRAP(rv = pwrite(fd, data, size, offset));
    476   1.1  pooka 	if (rv == -1)
    477  1.10  pooka 		seterror(errno);
    478   1.1  pooka 
    479   1.1  pooka 	return rv;
    480   1.1  pooka }
    481   1.1  pooka 
    482   1.1  pooka void
    483   1.1  pooka rumpuser_write_bio(int fd, const void *data, size_t size, off_t offset,
    484   1.1  pooka 	rump_biodone_fn biodone, void *biodonecookie)
    485   1.1  pooka {
    486   1.1  pooka 	ssize_t rv;
    487   1.1  pooka 	int error = 0;
    488   1.1  pooka 
    489   1.1  pooka 	rv = rumpuser_pwrite(fd, data, size, offset, &error);
    490   1.1  pooka 	/* check against <0 instead of ==-1 to get typing below right */
    491   1.1  pooka 	if (rv < 0)
    492   1.1  pooka 		rv = 0;
    493   1.1  pooka 
    494   1.1  pooka 	/* LINTED: see above */
    495   1.1  pooka 	biodone(biodonecookie, rv, error);
    496   1.1  pooka }
    497   1.1  pooka 
    498   1.1  pooka ssize_t
    499   1.1  pooka rumpuser_readv(int fd, const struct rumpuser_iovec *riov, int iovcnt,
    500   1.1  pooka 	int *error)
    501   1.1  pooka {
    502   1.1  pooka 	struct iovec *iovp;
    503   1.1  pooka 	ssize_t rv;
    504   1.1  pooka 	int i;
    505   1.1  pooka 
    506   1.1  pooka 	iovp = malloc(iovcnt * sizeof(struct iovec));
    507   1.1  pooka 	if (iovp == NULL) {
    508  1.10  pooka 		seterror(ENOMEM);
    509   1.1  pooka 		return -1;
    510   1.1  pooka 	}
    511   1.1  pooka 	for (i = 0; i < iovcnt; i++) {
    512   1.1  pooka 		iovp[i].iov_base = riov[i].iov_base;
    513   1.1  pooka 		/*LINTED*/
    514   1.1  pooka 		iovp[i].iov_len = riov[i].iov_len;
    515   1.1  pooka 	}
    516   1.1  pooka 
    517   1.1  pooka 	KLOCK_WRAP(rv = readv(fd, iovp, iovcnt));
    518   1.1  pooka 	if (rv == -1)
    519  1.10  pooka 		seterror(errno);
    520   1.1  pooka 	free(iovp);
    521   1.1  pooka 
    522   1.1  pooka 	return rv;
    523   1.1  pooka }
    524   1.1  pooka 
    525   1.1  pooka ssize_t
    526   1.1  pooka rumpuser_writev(int fd, const struct rumpuser_iovec *riov, int iovcnt,
    527   1.1  pooka 	int *error)
    528   1.1  pooka {
    529   1.1  pooka 	struct iovec *iovp;
    530   1.1  pooka 	ssize_t rv;
    531   1.1  pooka 	int i;
    532   1.1  pooka 
    533   1.1  pooka 	iovp = malloc(iovcnt * sizeof(struct iovec));
    534   1.1  pooka 	if (iovp == NULL) {
    535  1.10  pooka 		seterror(ENOMEM);
    536   1.1  pooka 		return -1;
    537   1.1  pooka 	}
    538   1.1  pooka 	for (i = 0; i < iovcnt; i++) {
    539   1.1  pooka 		iovp[i].iov_base = riov[i].iov_base;
    540   1.1  pooka 		/*LINTED*/
    541   1.1  pooka 		iovp[i].iov_len = riov[i].iov_len;
    542   1.1  pooka 	}
    543   1.1  pooka 
    544   1.1  pooka 	KLOCK_WRAP(rv = writev(fd, iovp, iovcnt));
    545   1.1  pooka 	if (rv == -1)
    546  1.10  pooka 		seterror(errno);
    547   1.1  pooka 	free(iovp);
    548   1.1  pooka 
    549   1.1  pooka 	return rv;
    550   1.1  pooka }
    551   1.1  pooka 
    552   1.1  pooka int
    553   1.1  pooka rumpuser_gettime(uint64_t *sec, uint64_t *nsec, int *error)
    554   1.1  pooka {
    555   1.1  pooka 	struct timeval tv;
    556   1.1  pooka 	int rv;
    557   1.1  pooka 
    558   1.1  pooka 	rv = gettimeofday(&tv, NULL);
    559   1.1  pooka 	if (rv == -1) {
    560  1.10  pooka 		seterror(errno);
    561   1.1  pooka 		return rv;
    562   1.1  pooka 	}
    563   1.1  pooka 
    564   1.1  pooka 	*sec = tv.tv_sec;
    565   1.1  pooka 	*nsec = tv.tv_usec * 1000;
    566   1.1  pooka 
    567   1.1  pooka 	return 0;
    568   1.1  pooka }
    569   1.1  pooka 
    570   1.1  pooka int
    571   1.1  pooka rumpuser_getenv(const char *name, char *buf, size_t blen, int *error)
    572   1.1  pooka {
    573   1.1  pooka 
    574   1.1  pooka 	DOCALL(int, getenv_r(name, buf, blen));
    575   1.1  pooka }
    576   1.1  pooka 
    577   1.1  pooka int
    578   1.1  pooka rumpuser_gethostname(char *name, size_t namelen, int *error)
    579   1.1  pooka {
    580  1.13  pooka 	char tmp[MAXHOSTNAMELEN];
    581   1.1  pooka 
    582  1.13  pooka 	if (gethostname(tmp, sizeof(tmp)) == -1) {
    583  1.23  pooka 		snprintf(name, namelen, "rump-%05d.rumpdomain", (int)getpid());
    584  1.13  pooka 	} else {
    585  1.13  pooka 		snprintf(name, namelen, "rump-%05d.%s.rumpdomain",
    586  1.23  pooka 		    (int)getpid(), tmp);
    587  1.13  pooka 	}
    588  1.13  pooka 
    589  1.13  pooka 	*error = 0;
    590  1.13  pooka 	return 0;
    591   1.1  pooka }
    592   1.1  pooka 
    593   1.1  pooka int
    594   1.1  pooka rumpuser_poll(struct pollfd *fds, int nfds, int timeout, int *error)
    595   1.1  pooka {
    596   1.1  pooka 
    597   1.1  pooka 	DOCALL_KLOCK(int, (poll(fds, (nfds_t)nfds, timeout)));
    598   1.1  pooka }
    599   1.1  pooka 
    600   1.1  pooka int
    601   1.1  pooka rumpuser_putchar(int c, int *error)
    602   1.1  pooka {
    603   1.1  pooka 
    604   1.1  pooka 	DOCALL(int, (putchar(c)));
    605   1.1  pooka }
    606   1.1  pooka 
    607   1.1  pooka void
    608   1.1  pooka rumpuser_exit(int rv)
    609   1.1  pooka {
    610   1.1  pooka 
    611   1.1  pooka 	if (rv == RUMPUSER_PANIC)
    612   1.1  pooka 		abort();
    613   1.1  pooka 	else
    614   1.1  pooka 		exit(rv);
    615   1.1  pooka }
    616   1.1  pooka 
    617   1.1  pooka void
    618   1.1  pooka rumpuser_seterrno(int error)
    619   1.1  pooka {
    620   1.1  pooka 
    621   1.1  pooka 	errno = error;
    622   1.1  pooka }
    623   1.1  pooka 
    624  1.21  pooka /*
    625  1.21  pooka  * On NetBSD we use kqueue, on Linux we use inotify.  The underlying
    626  1.21  pooka  * interface requirements aren't quite the same, but we have a very
    627  1.21  pooka  * good chance of doing the fd->path mapping on Linux thanks to dcache,
    628  1.21  pooka  * so just keep the existing interfaces for now.
    629  1.21  pooka  */
    630  1.21  pooka #if defined(__NetBSD__)
    631   1.1  pooka int
    632   1.1  pooka rumpuser_writewatchfile_setup(int kq, int fd, intptr_t opaque, int *error)
    633   1.1  pooka {
    634   1.1  pooka 	struct kevent kev;
    635   1.1  pooka 
    636   1.1  pooka 	if (kq == -1) {
    637   1.1  pooka 		kq = kqueue();
    638   1.1  pooka 		if (kq == -1) {
    639  1.10  pooka 			seterror(errno);
    640   1.1  pooka 			return -1;
    641   1.1  pooka 		}
    642   1.1  pooka 	}
    643   1.1  pooka 
    644   1.1  pooka 	EV_SET(&kev, fd, EVFILT_VNODE, EV_ADD|EV_ENABLE|EV_CLEAR,
    645   1.1  pooka 	    NOTE_WRITE, 0, opaque);
    646   1.1  pooka 	if (kevent(kq, &kev, 1, NULL, 0, NULL) == -1) {
    647  1.10  pooka 		seterror(errno);
    648   1.1  pooka 		return -1;
    649   1.1  pooka 	}
    650   1.1  pooka 
    651   1.1  pooka 	return kq;
    652   1.1  pooka }
    653   1.1  pooka 
    654   1.1  pooka int
    655   1.1  pooka rumpuser_writewatchfile_wait(int kq, intptr_t *opaque, int *error)
    656   1.1  pooka {
    657   1.1  pooka 	struct kevent kev;
    658   1.1  pooka 	int rv;
    659   1.1  pooka 
    660   1.9  pooka  again:
    661   1.1  pooka 	KLOCK_WRAP(rv = kevent(kq, NULL, 0, &kev, 1, NULL));
    662   1.1  pooka 	if (rv == -1) {
    663   1.9  pooka 		if (errno == EINTR)
    664   1.9  pooka 			goto again;
    665  1.10  pooka 		seterror(errno);
    666   1.1  pooka 		return -1;
    667   1.1  pooka 	}
    668   1.1  pooka 
    669   1.1  pooka 	if (opaque)
    670   1.1  pooka 		*opaque = kev.udata;
    671   1.1  pooka 	return rv;
    672   1.1  pooka }
    673  1.21  pooka 
    674  1.21  pooka #elif defined(__linux__)
    675  1.21  pooka #include <sys/inotify.h>
    676  1.21  pooka 
    677  1.21  pooka int
    678  1.21  pooka rumpuser_writewatchfile_setup(int inotify, int fd, intptr_t notused, int *error)
    679  1.21  pooka {
    680  1.21  pooka 	char procbuf[PATH_MAX], linkbuf[PATH_MAX];
    681  1.21  pooka 	ssize_t nn;
    682  1.21  pooka 
    683  1.21  pooka 	if (inotify == -1) {
    684  1.21  pooka 		inotify = inotify_init();
    685  1.21  pooka 		if (inotify == -1) {
    686  1.21  pooka 			seterror(errno);
    687  1.21  pooka 			return -1;
    688  1.21  pooka 		}
    689  1.21  pooka 	}
    690  1.21  pooka 
    691  1.21  pooka 	/* ok, need to map fd into path for inotify */
    692  1.21  pooka 	snprintf(procbuf, sizeof(procbuf), "/proc/self/fd/%d", fd);
    693  1.29  pooka 	nn = readlink(procbuf, linkbuf, sizeof(linkbuf)-1);
    694  1.29  pooka 	if (nn >= (ssize_t)sizeof(linkbuf)-1) {
    695  1.21  pooka 		nn = -1;
    696  1.21  pooka 		errno = E2BIG; /* pick something */
    697  1.21  pooka 	}
    698  1.21  pooka 	if (nn == -1) {
    699  1.21  pooka 		seterror(errno);
    700  1.21  pooka 		close(inotify);
    701  1.21  pooka 		return -1;
    702  1.21  pooka 	}
    703  1.21  pooka 
    704  1.29  pooka 	linkbuf[nn] = '\0';
    705  1.21  pooka 	if (inotify_add_watch(inotify, linkbuf, IN_MODIFY) == -1) {
    706  1.21  pooka 		seterror(errno);
    707  1.21  pooka 		close(inotify);
    708  1.21  pooka 		return -1;
    709  1.21  pooka 	}
    710  1.21  pooka 
    711  1.21  pooka 	return inotify;
    712  1.21  pooka }
    713  1.21  pooka 
    714  1.21  pooka int
    715  1.21  pooka rumpuser_writewatchfile_wait(int kq, intptr_t *opaque, int *error)
    716  1.21  pooka {
    717  1.21  pooka 	struct inotify_event iev;
    718  1.21  pooka 	ssize_t nn;
    719  1.21  pooka 
    720  1.21  pooka 	do {
    721  1.21  pooka 		KLOCK_WRAP(nn = read(kq, &iev, sizeof(iev)));
    722  1.21  pooka 	} while (errno == EINTR);
    723  1.21  pooka 
    724  1.21  pooka 	if (nn == -1) {
    725  1.21  pooka 		seterror(errno);
    726  1.21  pooka 		return -1;
    727  1.21  pooka 	}
    728  1.21  pooka 	return (nn/sizeof(iev));
    729  1.21  pooka }
    730  1.26  pooka 
    731  1.26  pooka #else
    732  1.26  pooka 
    733  1.26  pooka /* a polling default implementation */
    734  1.26  pooka int
    735  1.26  pooka rumpuser_writewatchfile_setup(int inotify, int fd, intptr_t notused, int *error)
    736  1.26  pooka {
    737  1.26  pooka 	static int warned = 0;
    738  1.26  pooka 
    739  1.26  pooka 	if (!warned) {
    740  1.27  pooka 		fprintf(stderr, "WARNING: rumpuser writewatchfile routines are "
    741  1.26  pooka 		    "polling-only on this platform\n");
    742  1.26  pooka 		warned = 1;
    743  1.26  pooka 	}
    744  1.26  pooka 
    745  1.26  pooka 	return 0;
    746  1.26  pooka }
    747  1.26  pooka 
    748  1.26  pooka int
    749  1.26  pooka rumpuser_writewatchfile_wait(int kq, intptr_t *opaque, int *error)
    750  1.26  pooka {
    751  1.26  pooka 
    752  1.26  pooka 	KLOCK_WRAP(usleep(10000));
    753  1.26  pooka 	return 0;
    754  1.26  pooka }
    755  1.18  pooka #endif
    756   1.1  pooka 
    757   1.1  pooka /*
    758   1.1  pooka  * This is meant for safe debugging prints from the kernel.
    759   1.1  pooka  */
    760   1.1  pooka int
    761   1.1  pooka rumpuser_dprintf(const char *format, ...)
    762   1.1  pooka {
    763   1.1  pooka 	va_list ap;
    764   1.1  pooka 	int rv;
    765   1.1  pooka 
    766   1.1  pooka 	va_start(ap, format);
    767   1.9  pooka 	rv = vfprintf(stderr, format, ap);
    768   1.1  pooka 	va_end(ap);
    769   1.1  pooka 
    770   1.1  pooka 	return rv;
    771   1.1  pooka }
    772   1.2  pooka 
    773   1.2  pooka int
    774   1.2  pooka rumpuser_kill(int64_t pid, int sig, int *error)
    775   1.2  pooka {
    776   1.2  pooka 
    777   1.3  pooka #ifdef __NetBSD__
    778   1.2  pooka 	if (pid == RUMPUSER_PID_SELF) {
    779   1.2  pooka 		DOCALL(int, raise(sig));
    780   1.2  pooka 	} else {
    781   1.2  pooka 		DOCALL(int, kill((pid_t)pid, sig));
    782   1.2  pooka 	}
    783   1.3  pooka #else
    784   1.3  pooka 	/* XXXfixme: signal numbers may not match on non-NetBSD */
    785  1.10  pooka 	seterror(EOPNOTSUPP);
    786   1.3  pooka 	return -1;
    787   1.3  pooka #endif
    788   1.2  pooka }
    789   1.4  pooka 
    790   1.4  pooka int
    791   1.4  pooka rumpuser_getnhostcpu(void)
    792   1.4  pooka {
    793  1.18  pooka 	int ncpu = 1;
    794  1.18  pooka 
    795  1.25  pooka #if defined(__NetBSD__) || defined(__FreeBSD__) || defined(__DragonFly__)
    796   1.4  pooka 	size_t sz = sizeof(ncpu);
    797   1.4  pooka 
    798  1.18  pooka 	sysctlbyname("hw.ncpu", &ncpu, &sz, NULL, 0);
    799  1.28  pooka #elif defined(__linux__) || defined(__CYGWIN__)
    800  1.18  pooka 	FILE *fp;
    801  1.18  pooka 	char *line = NULL;
    802  1.18  pooka 	size_t n = 0;
    803  1.18  pooka 
    804  1.18  pooka 	/* If anyone knows a better way, I'm all ears */
    805  1.18  pooka 	if ((fp = fopen("/proc/cpuinfo", "r")) != NULL) {
    806  1.18  pooka 		ncpu = 0;
    807  1.18  pooka 		while (getline(&line, &n, fp) != -1) {
    808  1.18  pooka 			if (strncmp(line,
    809  1.18  pooka 			    "processor", sizeof("processor")-1) == 0)
    810  1.18  pooka 			    	ncpu++;
    811  1.18  pooka 		}
    812  1.18  pooka 		if (ncpu == 0)
    813  1.18  pooka 			ncpu = 1;
    814  1.18  pooka 		free(line);
    815  1.18  pooka 		fclose(fp);
    816  1.18  pooka 	}
    817  1.23  pooka #elif __sun__
    818  1.23  pooka 	/* XXX: this is just a rough estimate ... */
    819  1.23  pooka 	ncpu = sysconf(_SC_NPROCESSORS_ONLN);
    820  1.18  pooka #endif
    821  1.18  pooka 
    822   1.4  pooka 	return ncpu;
    823   1.4  pooka }
    824  1.16    tls 
    825  1.18  pooka /* XXX: this hypercall needs a better name */
    826  1.16    tls uint32_t
    827  1.16    tls rumpuser_arc4random(void)
    828  1.16    tls {
    829  1.18  pooka 
    830  1.16    tls 	return arc4random();
    831  1.16    tls }
    832