Home | History | Annotate | Line # | Download | only in librumpuser
rumpuser.c revision 1.33
      1  1.33  pooka /*	$NetBSD: rumpuser.c,v 1.33 2013/04/27 16:56:29 pooka Exp $	*/
      2   1.1  pooka 
      3   1.1  pooka /*
      4   1.1  pooka  * Copyright (c) 2007-2010 Antti Kantee.  All Rights Reserved.
      5   1.1  pooka  *
      6   1.1  pooka  * Redistribution and use in source and binary forms, with or without
      7   1.1  pooka  * modification, are permitted provided that the following conditions
      8   1.1  pooka  * are met:
      9   1.1  pooka  * 1. Redistributions of source code must retain the above copyright
     10   1.1  pooka  *    notice, this list of conditions and the following disclaimer.
     11   1.1  pooka  * 2. Redistributions in binary form must reproduce the above copyright
     12   1.1  pooka  *    notice, this list of conditions and the following disclaimer in the
     13   1.1  pooka  *    documentation and/or other materials provided with the distribution.
     14   1.1  pooka  *
     15   1.1  pooka  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS
     16   1.1  pooka  * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
     17   1.1  pooka  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
     18   1.1  pooka  * DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
     19   1.1  pooka  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     20   1.1  pooka  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
     21   1.1  pooka  * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     22   1.1  pooka  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     23   1.1  pooka  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     24   1.1  pooka  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     25   1.1  pooka  * SUCH DAMAGE.
     26   1.1  pooka  */
     27   1.1  pooka 
     28  1.18  pooka #include "rumpuser_port.h"
     29  1.18  pooka 
     30   1.1  pooka #if !defined(lint)
     31  1.33  pooka __RCSID("$NetBSD: rumpuser.c,v 1.33 2013/04/27 16:56:29 pooka Exp $");
     32   1.1  pooka #endif /* !lint */
     33   1.1  pooka 
     34   1.1  pooka #include <sys/ioctl.h>
     35   1.1  pooka #include <sys/mman.h>
     36   1.1  pooka #include <sys/uio.h>
     37  1.18  pooka #include <sys/stat.h>
     38  1.18  pooka #include <sys/time.h>
     39   1.1  pooka 
     40   1.1  pooka #ifdef __NetBSD__
     41  1.15  pooka #include <sys/disk.h>
     42   1.1  pooka #include <sys/disklabel.h>
     43  1.15  pooka #include <sys/dkio.h>
     44  1.25  pooka #include <sys/event.h>
     45  1.25  pooka #endif
     46  1.25  pooka 
     47  1.25  pooka #if defined(__NetBSD__) || defined(__FreeBSD__) || defined(__DragonFly__)
     48   1.4  pooka #include <sys/sysctl.h>
     49   1.1  pooka #endif
     50   1.1  pooka 
     51   1.1  pooka #include <assert.h>
     52   1.1  pooka #include <errno.h>
     53   1.1  pooka #include <fcntl.h>
     54  1.23  pooka #include <netdb.h>
     55   1.2  pooka #include <signal.h>
     56   1.1  pooka #include <stdarg.h>
     57   1.1  pooka #include <stdint.h>
     58   1.1  pooka #include <stdio.h>
     59   1.1  pooka #include <stdlib.h>
     60   1.1  pooka #include <string.h>
     61   1.1  pooka #include <time.h>
     62   1.1  pooka #include <unistd.h>
     63   1.1  pooka 
     64   1.1  pooka #include <rump/rumpuser.h>
     65   1.1  pooka 
     66   1.1  pooka #include "rumpuser_int.h"
     67   1.1  pooka 
     68  1.30  pooka rump_unschedulefn	rumpuser__unschedule;
     69  1.30  pooka rump_reschedulefn	rumpuser__reschedule;
     70  1.30  pooka 
     71   1.1  pooka int
     72  1.30  pooka rumpuser_init(int version,
     73  1.30  pooka 	rump_reschedulefn rumpkern_resched, rump_unschedulefn rumpkern_unsched)
     74   1.8  pooka {
     75   1.8  pooka 
     76  1.30  pooka 	if (version != RUMPUSER_VERSION) {
     77  1.30  pooka 		fprintf(stderr, "rumpuser mismatch, kern: %d, hypervisor %d\n",
     78  1.30  pooka 		    version, RUMPUSER_VERSION);
     79  1.30  pooka 		return 1;
     80  1.30  pooka 	}
     81  1.30  pooka 
     82  1.33  pooka #ifdef RUMPUSER_USE_DEVRANDOM
     83  1.30  pooka 	uint32_t rv;
     84  1.30  pooka 	int fd;
     85  1.30  pooka 
     86  1.30  pooka 	if ((fd = open("/dev/urandom", O_RDONLY)) == -1) {
     87  1.30  pooka 		srandom(time(NULL));
     88  1.30  pooka 	} else {
     89  1.30  pooka 		if (read(fd, &rv, sizeof(rv)) != sizeof(rv))
     90  1.30  pooka 			srandom(time(NULL));
     91  1.30  pooka 		else
     92  1.30  pooka 			srandom(rv);
     93  1.30  pooka 		close(fd);
     94  1.30  pooka 	}
     95  1.30  pooka #endif
     96  1.30  pooka 
     97  1.30  pooka 	rumpuser__thrinit();
     98  1.30  pooka 
     99  1.30  pooka 	rumpuser__unschedule = rumpkern_unsched;
    100  1.30  pooka 	rumpuser__reschedule = rumpkern_resched;
    101  1.30  pooka 
    102  1.30  pooka 	return 0;
    103   1.8  pooka }
    104   1.8  pooka 
    105   1.8  pooka int
    106   1.1  pooka rumpuser_getfileinfo(const char *path, uint64_t *sizep, int *ftp, int *error)
    107   1.1  pooka {
    108   1.1  pooka 	struct stat sb;
    109   1.1  pooka 	uint64_t size;
    110   1.1  pooka 	int needsdev = 0, rv = 0, ft;
    111  1.12  pooka 	int fd = -1;
    112   1.1  pooka 
    113   1.1  pooka 	if (stat(path, &sb) == -1) {
    114  1.10  pooka 		seterror(errno);
    115   1.1  pooka 		return -1;
    116   1.1  pooka 	}
    117   1.1  pooka 
    118   1.1  pooka 	switch (sb.st_mode & S_IFMT) {
    119   1.1  pooka 	case S_IFDIR:
    120   1.1  pooka 		ft = RUMPUSER_FT_DIR;
    121   1.1  pooka 		break;
    122   1.1  pooka 	case S_IFREG:
    123   1.1  pooka 		ft = RUMPUSER_FT_REG;
    124   1.1  pooka 		break;
    125   1.1  pooka 	case S_IFBLK:
    126   1.1  pooka 		ft = RUMPUSER_FT_BLK;
    127   1.1  pooka 		needsdev = 1;
    128   1.1  pooka 		break;
    129   1.1  pooka 	case S_IFCHR:
    130   1.1  pooka 		ft = RUMPUSER_FT_CHR;
    131   1.1  pooka 		needsdev = 1;
    132   1.1  pooka 		break;
    133   1.1  pooka 	default:
    134   1.1  pooka 		ft = RUMPUSER_FT_OTHER;
    135   1.1  pooka 		break;
    136   1.1  pooka 	}
    137   1.1  pooka 
    138   1.1  pooka 	if (!needsdev) {
    139   1.1  pooka 		size = sb.st_size;
    140   1.1  pooka 	} else if (sizep) {
    141   1.1  pooka 		/*
    142   1.1  pooka 		 * Welcome to the jungle.  Of course querying the kernel
    143   1.1  pooka 		 * for a device partition size is supposed to be far from
    144   1.1  pooka 		 * trivial.  On NetBSD we use ioctl.  On $other platform
    145   1.1  pooka 		 * we have a problem.  We try "the lseek trick" and just
    146   1.1  pooka 		 * fail if that fails.  Platform specific code can later
    147   1.1  pooka 		 * be written here if appropriate.
    148   1.1  pooka 		 *
    149   1.1  pooka 		 * On NetBSD we hope and pray that for block devices nobody
    150   1.1  pooka 		 * else is holding them open, because otherwise the kernel
    151   1.1  pooka 		 * will not permit us to open it.  Thankfully, this is
    152   1.1  pooka 		 * usually called only in bootstrap and then we can
    153   1.1  pooka 		 * forget about it.
    154   1.1  pooka 		 */
    155   1.1  pooka #ifndef __NetBSD__
    156   1.1  pooka 		off_t off;
    157   1.1  pooka 
    158   1.1  pooka 		fd = open(path, O_RDONLY);
    159   1.1  pooka 		if (fd == -1) {
    160  1.10  pooka 			seterror(errno);
    161   1.1  pooka 			rv = -1;
    162   1.1  pooka 			goto out;
    163   1.1  pooka 		}
    164   1.1  pooka 
    165   1.1  pooka 		off = lseek(fd, 0, SEEK_END);
    166   1.1  pooka 		if (off != 0) {
    167   1.1  pooka 			size = off;
    168   1.1  pooka 			goto out;
    169   1.1  pooka 		}
    170   1.1  pooka 		fprintf(stderr, "error: device size query not implemented on "
    171   1.1  pooka 		    "this platform\n");
    172  1.12  pooka 		seterror(EOPNOTSUPP);
    173   1.1  pooka 		rv = -1;
    174   1.1  pooka 		goto out;
    175   1.1  pooka #else
    176   1.1  pooka 		struct disklabel lab;
    177   1.1  pooka 		struct partition *parta;
    178  1.15  pooka 		struct dkwedge_info dkw;
    179   1.1  pooka 
    180   1.1  pooka 		fd = open(path, O_RDONLY);
    181   1.1  pooka 		if (fd == -1) {
    182  1.10  pooka 			seterror(errno);
    183   1.1  pooka 			rv = -1;
    184   1.1  pooka 			goto out;
    185   1.1  pooka 		}
    186   1.1  pooka 
    187  1.15  pooka 		if (ioctl(fd, DIOCGDINFO, &lab) == 0) {
    188  1.15  pooka 			parta = &lab.d_partitions[DISKPART(sb.st_rdev)];
    189  1.15  pooka 			size = (uint64_t)lab.d_secsize * parta->p_size;
    190  1.15  pooka 			goto out;
    191  1.15  pooka 		}
    192  1.15  pooka 
    193  1.15  pooka 		if (ioctl(fd, DIOCGWEDGEINFO, &dkw) == 0) {
    194  1.15  pooka 			/*
    195  1.15  pooka 			 * XXX: should use DIOCGDISKINFO to query
    196  1.15  pooka 			 * sector size, but that requires proplib,
    197  1.15  pooka 			 * so just don't bother for now.  it's nice
    198  1.15  pooka 			 * that something as difficult as figuring out
    199  1.15  pooka 			 * a partition's size has been made so easy.
    200  1.15  pooka 			 */
    201  1.15  pooka 			size = dkw.dkw_size << DEV_BSHIFT;
    202   1.1  pooka 			goto out;
    203   1.1  pooka 		}
    204   1.1  pooka 
    205  1.15  pooka 		seterror(errno);
    206  1.15  pooka 		rv = -1;
    207   1.1  pooka #endif /* __NetBSD__ */
    208   1.1  pooka 	}
    209   1.1  pooka 
    210   1.1  pooka  out:
    211   1.1  pooka 	if (rv == 0 && sizep)
    212   1.1  pooka 		*sizep = size;
    213   1.1  pooka 	if (rv == 0 && ftp)
    214   1.1  pooka 		*ftp = ft;
    215  1.12  pooka 	if (fd != -1)
    216  1.12  pooka 		close(fd);
    217   1.1  pooka 
    218   1.1  pooka 	return rv;
    219   1.1  pooka }
    220   1.1  pooka 
/*
 * Sleep for the interval given by *sec / *nsec.
 *
 * sec, nsec:  in: requested interval; out: time left to sleep
 * error:      receives errno if nanosleep(2) fails (through seterror())
 *
 * nanosleep(2) only writes the remaining time when it is interrupted,
 * so the remainder is preset to zero; a completed sleep therefore
 * reports "nothing left" instead of indeterminate stack contents.
 *
 * Returns the nanosleep(2) result (0 or -1).
 */
int
rumpuser_nanosleep(uint64_t *sec, uint64_t *nsec, int *error)
{
	struct timespec rqt, rmt;
	int rv;

	/*LINTED*/
	rqt.tv_sec = *sec;
	/*LINTED*/
	rqt.tv_nsec = *nsec;

	rmt.tv_sec = 0;
	rmt.tv_nsec = 0;

	KLOCK_WRAP(rv = nanosleep(&rqt, &rmt));
	if (rv == -1)
		seterror(errno);

	*sec = rmt.tv_sec;
	*nsec = rmt.tv_nsec;

	return rv;
}
    241   1.1  pooka 
/*
 * Allocate `howmuch' bytes aligned to `alignment' bytes using
 * posix_memalign(3).  An alignment of 0 selects sizeof(void *).
 *
 * Returns the allocation, or NULL if posix_memalign() fails for any
 * reason other than EINVAL.  An alignment rejected with EINVAL is
 * treated as a programming error: a message is printed and the
 * process aborts.
 */
void *
rumpuser_malloc(size_t howmuch, int alignment)
{
	void *ptr;
	int memerr;

	if (alignment == 0)
		alignment = sizeof(void *);

	memerr = posix_memalign(&ptr, (size_t)alignment, howmuch);
	if (__predict_false(memerr != 0)) {
		if (memerr != EINVAL)
			return NULL;

		printf("rumpuser_malloc: invalid alignment %d\n",
		    alignment);
		abort();
	}

	return ptr;
}
    263   1.1  pooka 
/*
 * Release memory with free(3).  The `size' argument is accepted as
 * part of the interface but is not used here.
 */
/*ARGSUSED1*/
void
rumpuser_free(void *ptr, size_t size)
{

	(void)size;
	free(ptr);
}
    271   1.1  pooka 
    272   1.1  pooka void *
    273   1.7  pooka rumpuser_anonmmap(void *prefaddr, size_t size, int alignbit,
    274   1.7  pooka 	int exec, int *error)
    275   1.1  pooka {
    276   1.1  pooka 	void *rv;
    277   1.1  pooka 	int prot;
    278   1.1  pooka 
    279  1.18  pooka #ifndef MAP_ALIGNED
    280  1.18  pooka #define MAP_ALIGNED(a) 0
    281  1.18  pooka 	if (alignbit)
    282  1.18  pooka 		fprintf(stderr, "rumpuser_anonmmap: warning, requested "
    283  1.18  pooka 		    "alignment not supported by hypervisor\n");
    284  1.18  pooka #endif
    285  1.18  pooka 
    286   1.1  pooka 	prot = PROT_READ|PROT_WRITE;
    287   1.1  pooka 	if (exec)
    288   1.1  pooka 		prot |= PROT_EXEC;
    289   1.7  pooka 	rv = mmap(prefaddr, size, prot,
    290  1.24  pooka 	    MAP_PRIVATE | MAP_ANON | MAP_ALIGNED(alignbit), -1, 0);
    291   1.1  pooka 	if (rv == MAP_FAILED) {
    292  1.10  pooka 		seterror(errno);
    293   1.1  pooka 		return NULL;
    294   1.1  pooka 	}
    295   1.1  pooka 	return rv;
    296   1.1  pooka }
    297   1.1  pooka 
/*
 * Remove the mapping [addr, addr+len) with munmap(2).  Failure is not
 * reported to the caller; it trips an assertion instead.
 */
void
rumpuser_unmap(void *addr, size_t len)
{
	int unmaprv;

	/* keep the call outside assert() so it survives NDEBUG builds */
	unmaprv = munmap(addr, len);
	assert(unmaprv == 0);
}
    306   1.1  pooka 
    307   1.1  pooka void *
    308   1.1  pooka rumpuser_filemmap(int fd, off_t offset, size_t len, int flags, int *error)
    309   1.1  pooka {
    310   1.1  pooka 	void *rv;
    311   1.1  pooka 	int mmflags, prot;
    312   1.1  pooka 
    313  1.22  pooka 	if (flags & RUMPUSER_FILEMMAP_TRUNCATE) {
    314  1.22  pooka 		if (ftruncate(fd, offset + len) == -1) {
    315  1.22  pooka 			seterror(errno);
    316  1.22  pooka 			return NULL;
    317  1.22  pooka 		}
    318  1.22  pooka 	}
    319   1.1  pooka 
    320  1.23  pooka /* it's implicit */
    321  1.23  pooka #if defined(__sun__) && !defined(MAP_FILE)
    322  1.23  pooka #define MAP_FILE 0
    323  1.23  pooka #endif
    324  1.23  pooka 
    325   1.1  pooka 	mmflags = MAP_FILE;
    326   1.1  pooka 	if (flags & RUMPUSER_FILEMMAP_SHARED)
    327   1.1  pooka 		mmflags |= MAP_SHARED;
    328   1.1  pooka 	else
    329   1.1  pooka 		mmflags |= MAP_PRIVATE;
    330   1.1  pooka 
    331   1.1  pooka 	prot = 0;
    332   1.1  pooka 	if (flags & RUMPUSER_FILEMMAP_READ)
    333   1.1  pooka 		prot |= PROT_READ;
    334   1.1  pooka 	if (flags & RUMPUSER_FILEMMAP_WRITE)
    335   1.1  pooka 		prot |= PROT_WRITE;
    336   1.1  pooka 
    337   1.1  pooka 	rv = mmap(NULL, len, PROT_READ|PROT_WRITE, mmflags, fd, offset);
    338   1.1  pooka 	if (rv == MAP_FAILED) {
    339  1.10  pooka 		seterror(errno);
    340   1.1  pooka 		return NULL;
    341   1.1  pooka 	}
    342   1.1  pooka 
    343  1.10  pooka 	seterror(0);
    344   1.1  pooka 	return rv;
    345   1.1  pooka }
    346   1.1  pooka 
    347   1.1  pooka int
    348   1.1  pooka rumpuser_memsync(void *addr, size_t len, int *error)
    349   1.1  pooka {
    350   1.1  pooka 
    351   1.1  pooka 	DOCALL_KLOCK(int, (msync(addr, len, MS_SYNC)));
    352   1.1  pooka }
    353   1.1  pooka 
    354   1.1  pooka int
    355  1.20  pooka rumpuser_open(const char *path, int ruflags, int *error)
    356   1.1  pooka {
    357  1.20  pooka 	int flags;
    358   1.1  pooka 
    359  1.20  pooka 	switch (ruflags & RUMPUSER_OPEN_ACCMODE) {
    360  1.20  pooka 	case RUMPUSER_OPEN_RDONLY:
    361  1.20  pooka 		flags = O_RDONLY;
    362  1.20  pooka 		break;
    363  1.20  pooka 	case RUMPUSER_OPEN_WRONLY:
    364  1.20  pooka 		flags = O_WRONLY;
    365  1.20  pooka 		break;
    366  1.20  pooka 	case RUMPUSER_OPEN_RDWR:
    367  1.20  pooka 		flags = O_RDWR;
    368  1.20  pooka 		break;
    369  1.20  pooka 	default:
    370  1.20  pooka 		*error = EINVAL;
    371  1.20  pooka 		return -1;
    372  1.20  pooka 	}
    373  1.20  pooka 
    374  1.20  pooka #define TESTSET(_ru_, _h_) if (ruflags & _ru_) flags |= _h_;
    375  1.20  pooka 	TESTSET(RUMPUSER_OPEN_CREATE, O_CREAT);
    376  1.20  pooka 	TESTSET(RUMPUSER_OPEN_EXCL, O_EXCL);
    377  1.23  pooka #ifdef O_DIRECT
    378  1.20  pooka 	TESTSET(RUMPUSER_OPEN_DIRECT, O_DIRECT);
    379  1.23  pooka #else
    380  1.23  pooka 	if (ruflags & RUMPUSER_OPEN_DIRECT) {
    381  1.23  pooka 		*error = EOPNOTSUPP;
    382  1.23  pooka 		return -1;
    383  1.23  pooka 	}
    384  1.23  pooka #endif
    385  1.20  pooka #undef TESTSET
    386  1.20  pooka 
    387  1.20  pooka 	DOCALL_KLOCK(int, (open(path, flags, 0644)));
    388   1.1  pooka }
    389   1.1  pooka 
    390   1.1  pooka int
    391   1.1  pooka rumpuser_ioctl(int fd, u_long cmd, void *data, int *error)
    392   1.1  pooka {
    393   1.1  pooka 
    394   1.1  pooka 	DOCALL_KLOCK(int, (ioctl(fd, cmd, data)));
    395   1.1  pooka }
    396   1.1  pooka 
    397   1.1  pooka int
    398   1.1  pooka rumpuser_close(int fd, int *error)
    399   1.1  pooka {
    400   1.1  pooka 
    401   1.1  pooka 	DOCALL(int, close(fd));
    402   1.1  pooka }
    403   1.1  pooka 
    404   1.1  pooka int
    405   1.1  pooka rumpuser_fsync(int fd, int *error)
    406   1.1  pooka {
    407   1.1  pooka 
    408   1.1  pooka 	DOCALL_KLOCK(int, fsync(fd));
    409   1.1  pooka }
    410   1.1  pooka 
/*
 * read(2) up to `size' bytes from `fd' into `data'.  The system call
 * is issued through KLOCK_WRAP (defined outside this file).
 *
 * Returns the read(2) result; on -1 errno is passed to seterror().
 */
ssize_t
rumpuser_read(int fd, void *data, size_t size, int *error)
{
	ssize_t nread;

	KLOCK_WRAP(nread = read(fd, data, size));
	if (nread == -1) {
		seterror(errno);
	}

	return nread;
}
    422   1.1  pooka 
/*
 * pread(2) up to `size' bytes from `fd' at `offset' into `data'.  The
 * system call is issued through KLOCK_WRAP (defined outside this
 * file).
 *
 * Returns the pread(2) result; on -1 errno is passed to seterror().
 */
ssize_t
rumpuser_pread(int fd, void *data, size_t size, off_t offset, int *error)
{
	ssize_t nread;

	KLOCK_WRAP(nread = pread(fd, data, size, offset));
	if (nread == -1) {
		seterror(errno);
	}

	return nread;
}
    434   1.1  pooka 
    435   1.1  pooka void
    436   1.1  pooka rumpuser_read_bio(int fd, void *data, size_t size, off_t offset,
    437   1.1  pooka 	rump_biodone_fn biodone, void *biodonecookie)
    438   1.1  pooka {
    439   1.1  pooka 	ssize_t rv;
    440   1.1  pooka 	int error = 0;
    441   1.1  pooka 
    442   1.1  pooka 	rv = rumpuser_pread(fd, data, size, offset, &error);
    443   1.1  pooka 	/* check against <0 instead of ==-1 to get typing below right */
    444   1.1  pooka 	if (rv < 0)
    445   1.1  pooka 		rv = 0;
    446   1.1  pooka 
    447   1.1  pooka 	/* LINTED: see above */
    448   1.1  pooka 	biodone(biodonecookie, rv, error);
    449   1.1  pooka }
    450   1.1  pooka 
/*
 * write(2) up to `size' bytes from `data' to `fd'.  The system call
 * is issued through KLOCK_WRAP (defined outside this file).
 *
 * Returns the write(2) result; on -1 errno is passed to seterror().
 */
ssize_t
rumpuser_write(int fd, const void *data, size_t size, int *error)
{
	ssize_t nwritten;

	KLOCK_WRAP(nwritten = write(fd, data, size));
	if (nwritten == -1) {
		seterror(errno);
	}

	return nwritten;
}
    462   1.1  pooka 
/*
 * pwrite(2) up to `size' bytes from `data' to `fd' at `offset'.  The
 * system call is issued through KLOCK_WRAP (defined outside this
 * file).
 *
 * Returns the pwrite(2) result; on -1 errno is passed to seterror().
 */
ssize_t
rumpuser_pwrite(int fd, const void *data, size_t size, off_t offset, int *error)
{
	ssize_t nwritten;

	KLOCK_WRAP(nwritten = pwrite(fd, data, size, offset));
	if (nwritten == -1) {
		seterror(errno);
	}

	return nwritten;
}
    474   1.1  pooka 
    475   1.1  pooka void
    476   1.1  pooka rumpuser_write_bio(int fd, const void *data, size_t size, off_t offset,
    477   1.1  pooka 	rump_biodone_fn biodone, void *biodonecookie)
    478   1.1  pooka {
    479   1.1  pooka 	ssize_t rv;
    480   1.1  pooka 	int error = 0;
    481   1.1  pooka 
    482   1.1  pooka 	rv = rumpuser_pwrite(fd, data, size, offset, &error);
    483   1.1  pooka 	/* check against <0 instead of ==-1 to get typing below right */
    484   1.1  pooka 	if (rv < 0)
    485   1.1  pooka 		rv = 0;
    486   1.1  pooka 
    487   1.1  pooka 	/* LINTED: see above */
    488   1.1  pooka 	biodone(biodonecookie, rv, error);
    489   1.1  pooka }
    490   1.1  pooka 
    491   1.1  pooka ssize_t
    492   1.1  pooka rumpuser_readv(int fd, const struct rumpuser_iovec *riov, int iovcnt,
    493   1.1  pooka 	int *error)
    494   1.1  pooka {
    495   1.1  pooka 	struct iovec *iovp;
    496   1.1  pooka 	ssize_t rv;
    497   1.1  pooka 	int i;
    498   1.1  pooka 
    499   1.1  pooka 	iovp = malloc(iovcnt * sizeof(struct iovec));
    500   1.1  pooka 	if (iovp == NULL) {
    501  1.10  pooka 		seterror(ENOMEM);
    502   1.1  pooka 		return -1;
    503   1.1  pooka 	}
    504   1.1  pooka 	for (i = 0; i < iovcnt; i++) {
    505   1.1  pooka 		iovp[i].iov_base = riov[i].iov_base;
    506   1.1  pooka 		/*LINTED*/
    507   1.1  pooka 		iovp[i].iov_len = riov[i].iov_len;
    508   1.1  pooka 	}
    509   1.1  pooka 
    510   1.1  pooka 	KLOCK_WRAP(rv = readv(fd, iovp, iovcnt));
    511   1.1  pooka 	if (rv == -1)
    512  1.10  pooka 		seterror(errno);
    513   1.1  pooka 	free(iovp);
    514   1.1  pooka 
    515   1.1  pooka 	return rv;
    516   1.1  pooka }
    517   1.1  pooka 
    518   1.1  pooka ssize_t
    519   1.1  pooka rumpuser_writev(int fd, const struct rumpuser_iovec *riov, int iovcnt,
    520   1.1  pooka 	int *error)
    521   1.1  pooka {
    522   1.1  pooka 	struct iovec *iovp;
    523   1.1  pooka 	ssize_t rv;
    524   1.1  pooka 	int i;
    525   1.1  pooka 
    526   1.1  pooka 	iovp = malloc(iovcnt * sizeof(struct iovec));
    527   1.1  pooka 	if (iovp == NULL) {
    528  1.10  pooka 		seterror(ENOMEM);
    529   1.1  pooka 		return -1;
    530   1.1  pooka 	}
    531   1.1  pooka 	for (i = 0; i < iovcnt; i++) {
    532   1.1  pooka 		iovp[i].iov_base = riov[i].iov_base;
    533   1.1  pooka 		/*LINTED*/
    534   1.1  pooka 		iovp[i].iov_len = riov[i].iov_len;
    535   1.1  pooka 	}
    536   1.1  pooka 
    537   1.1  pooka 	KLOCK_WRAP(rv = writev(fd, iovp, iovcnt));
    538   1.1  pooka 	if (rv == -1)
    539  1.10  pooka 		seterror(errno);
    540   1.1  pooka 	free(iovp);
    541   1.1  pooka 
    542   1.1  pooka 	return rv;
    543   1.1  pooka }
    544   1.1  pooka 
/*
 * Fetch the host's wall-clock time with gettimeofday(2).
 *
 * sec:    receives the seconds part
 * nsec:   receives the sub-second part in nanoseconds (the
 *         microsecond value multiplied by 1000)
 * error:  receives errno on failure (through seterror())
 *
 * Returns 0 on success, -1 on failure (outputs untouched).
 */
int
rumpuser_gettime(uint64_t *sec, uint64_t *nsec, int *error)
{
	struct timeval now;

	if (gettimeofday(&now, NULL) == -1) {
		seterror(errno);
		return -1;
	}

	*sec = now.tv_sec;
	*nsec = now.tv_usec * 1000;

	return 0;
}
    562   1.1  pooka 
    563   1.1  pooka int
    564   1.1  pooka rumpuser_getenv(const char *name, char *buf, size_t blen, int *error)
    565   1.1  pooka {
    566   1.1  pooka 
    567   1.1  pooka 	DOCALL(int, getenv_r(name, buf, blen));
    568   1.1  pooka }
    569   1.1  pooka 
/*
 * Produce a host name for the rump kernel instance.
 *
 * The name is "rump-<pid>.<hostname>.rumpdomain", or
 * "rump-<pid>.rumpdomain" if the host name cannot be queried, where
 * <pid> is the zero-padded process id.  It is written to `name' with
 * snprintf(3), i.e. truncated to fit `namelen'.
 *
 * Always returns 0 and reports error 0.
 */
int
rumpuser_gethostname(char *name, size_t namelen, int *error)
{
	char tmp[MAXHOSTNAMELEN];

	if (gethostname(tmp, sizeof(tmp)) == -1) {
		snprintf(name, namelen, "rump-%05d.rumpdomain", (int)getpid());
	} else {
		/*
		 * gethostname() is allowed to leave a truncated name
		 * without a terminating NUL; make sure %s below stops
		 * inside the buffer.
		 */
		tmp[sizeof(tmp)-1] = '\0';
		snprintf(name, namelen, "rump-%05d.%s.rumpdomain",
		    (int)getpid(), tmp);
	}

	seterror(0);
	return 0;
}
    585   1.1  pooka 
    586   1.1  pooka int
    587   1.1  pooka rumpuser_putchar(int c, int *error)
    588   1.1  pooka {
    589   1.1  pooka 
    590   1.1  pooka 	DOCALL(int, (putchar(c)));
    591   1.1  pooka }
    592   1.1  pooka 
    593   1.1  pooka void
    594   1.1  pooka rumpuser_exit(int rv)
    595   1.1  pooka {
    596   1.1  pooka 
    597   1.1  pooka 	if (rv == RUMPUSER_PANIC)
    598   1.1  pooka 		abort();
    599   1.1  pooka 	else
    600   1.1  pooka 		exit(rv);
    601   1.1  pooka }
    602   1.1  pooka 
/*
 * Store `error' in the calling thread's host errno.
 */
void
rumpuser_seterrno(int error)
{

	errno = error;
}
    609   1.1  pooka 
    610  1.21  pooka /*
    611  1.21  pooka  * On NetBSD we use kqueue, on Linux we use inotify.  The underlying
    612  1.21  pooka  * interface requirements aren't quite the same, but we have a very
    613  1.21  pooka  * good chance of doing the fd->path mapping on Linux thanks to dcache,
    614  1.21  pooka  * so just keep the existing interfaces for now.
    615  1.21  pooka  */
    616  1.21  pooka #if defined(__NetBSD__)
    617   1.1  pooka int
    618   1.1  pooka rumpuser_writewatchfile_setup(int kq, int fd, intptr_t opaque, int *error)
    619   1.1  pooka {
    620   1.1  pooka 	struct kevent kev;
    621   1.1  pooka 
    622   1.1  pooka 	if (kq == -1) {
    623   1.1  pooka 		kq = kqueue();
    624   1.1  pooka 		if (kq == -1) {
    625  1.10  pooka 			seterror(errno);
    626   1.1  pooka 			return -1;
    627   1.1  pooka 		}
    628   1.1  pooka 	}
    629   1.1  pooka 
    630   1.1  pooka 	EV_SET(&kev, fd, EVFILT_VNODE, EV_ADD|EV_ENABLE|EV_CLEAR,
    631   1.1  pooka 	    NOTE_WRITE, 0, opaque);
    632   1.1  pooka 	if (kevent(kq, &kev, 1, NULL, 0, NULL) == -1) {
    633  1.10  pooka 		seterror(errno);
    634   1.1  pooka 		return -1;
    635   1.1  pooka 	}
    636   1.1  pooka 
    637   1.1  pooka 	return kq;
    638   1.1  pooka }
    639   1.1  pooka 
    640   1.1  pooka int
    641   1.1  pooka rumpuser_writewatchfile_wait(int kq, intptr_t *opaque, int *error)
    642   1.1  pooka {
    643   1.1  pooka 	struct kevent kev;
    644   1.1  pooka 	int rv;
    645   1.1  pooka 
    646   1.9  pooka  again:
    647   1.1  pooka 	KLOCK_WRAP(rv = kevent(kq, NULL, 0, &kev, 1, NULL));
    648   1.1  pooka 	if (rv == -1) {
    649   1.9  pooka 		if (errno == EINTR)
    650   1.9  pooka 			goto again;
    651  1.10  pooka 		seterror(errno);
    652   1.1  pooka 		return -1;
    653   1.1  pooka 	}
    654   1.1  pooka 
    655   1.1  pooka 	if (opaque)
    656   1.1  pooka 		*opaque = kev.udata;
    657   1.1  pooka 	return rv;
    658   1.1  pooka }
    659  1.21  pooka 
    660  1.21  pooka #elif defined(__linux__)
    661  1.21  pooka #include <sys/inotify.h>
    662  1.21  pooka 
    663  1.21  pooka int
    664  1.21  pooka rumpuser_writewatchfile_setup(int inotify, int fd, intptr_t notused, int *error)
    665  1.21  pooka {
    666  1.21  pooka 	char procbuf[PATH_MAX], linkbuf[PATH_MAX];
    667  1.21  pooka 	ssize_t nn;
    668  1.21  pooka 
    669  1.21  pooka 	if (inotify == -1) {
    670  1.21  pooka 		inotify = inotify_init();
    671  1.21  pooka 		if (inotify == -1) {
    672  1.21  pooka 			seterror(errno);
    673  1.21  pooka 			return -1;
    674  1.21  pooka 		}
    675  1.21  pooka 	}
    676  1.21  pooka 
    677  1.21  pooka 	/* ok, need to map fd into path for inotify */
    678  1.21  pooka 	snprintf(procbuf, sizeof(procbuf), "/proc/self/fd/%d", fd);
    679  1.29  pooka 	nn = readlink(procbuf, linkbuf, sizeof(linkbuf)-1);
    680  1.29  pooka 	if (nn >= (ssize_t)sizeof(linkbuf)-1) {
    681  1.21  pooka 		nn = -1;
    682  1.21  pooka 		errno = E2BIG; /* pick something */
    683  1.21  pooka 	}
    684  1.21  pooka 	if (nn == -1) {
    685  1.21  pooka 		seterror(errno);
    686  1.21  pooka 		close(inotify);
    687  1.21  pooka 		return -1;
    688  1.21  pooka 	}
    689  1.21  pooka 
    690  1.29  pooka 	linkbuf[nn] = '\0';
    691  1.21  pooka 	if (inotify_add_watch(inotify, linkbuf, IN_MODIFY) == -1) {
    692  1.21  pooka 		seterror(errno);
    693  1.21  pooka 		close(inotify);
    694  1.21  pooka 		return -1;
    695  1.21  pooka 	}
    696  1.21  pooka 
    697  1.21  pooka 	return inotify;
    698  1.21  pooka }
    699  1.21  pooka 
    700  1.21  pooka int
    701  1.21  pooka rumpuser_writewatchfile_wait(int kq, intptr_t *opaque, int *error)
    702  1.21  pooka {
    703  1.21  pooka 	struct inotify_event iev;
    704  1.21  pooka 	ssize_t nn;
    705  1.21  pooka 
    706  1.21  pooka 	do {
    707  1.21  pooka 		KLOCK_WRAP(nn = read(kq, &iev, sizeof(iev)));
    708  1.21  pooka 	} while (errno == EINTR);
    709  1.21  pooka 
    710  1.21  pooka 	if (nn == -1) {
    711  1.21  pooka 		seterror(errno);
    712  1.21  pooka 		return -1;
    713  1.21  pooka 	}
    714  1.21  pooka 	return (nn/sizeof(iev));
    715  1.21  pooka }
    716  1.26  pooka 
    717  1.26  pooka #else
    718  1.26  pooka 
    719  1.26  pooka /* a polling default implementation */
/*
 * Fallback for hosts without a file change notification facility:
 * nothing is registered, all arguments are ignored and 0 is returned.
 * A warning is printed to stderr on the first call only.
 */
int
rumpuser_writewatchfile_setup(int inotify, int fd, intptr_t notused, int *error)
{
	static int warned = 0;

	if (warned == 0) {
		warned = 1;
		fprintf(stderr, "WARNING: rumpuser writewatchfile routines are "
		    "polling-only on this platform\n");
	}

	return 0;
}
    733  1.26  pooka 
/*
 * Fallback "wait": sleep for 10000 microseconds and return 0, leaving
 * it to the caller to poll.  All arguments are ignored.  The sleep is
 * issued through KLOCK_WRAP (defined outside this file).
 */
int
rumpuser_writewatchfile_wait(int kq, intptr_t *opaque, int *error)
{

	KLOCK_WRAP(usleep(10000));

	return 0;
}
    741  1.18  pooka #endif
    742   1.1  pooka 
/*
 * printf-style output to stderr, meant for safe debugging prints
 * from the kernel.
 *
 * Returns whatever vfprintf(3) returns.
 */
int
rumpuser_dprintf(const char *format, ...)
{
	va_list args;
	int nprinted;

	va_start(args, format);
	nprinted = vfprintf(stderr, format, args);
	va_end(args);

	return nprinted;
}
    758   1.2  pooka 
/*
 * Deliver signal `sig' to host process `pid'.
 *
 * Only implemented on NetBSD, where RUMPUSER_PID_SELF selects
 * raise(3) and any other pid goes to kill(2); the call, the return
 * value and `error' are handled by the DOCALL macro (defined outside
 * this file).  Everywhere else the call fails with EOPNOTSUPP and
 * returns -1.
 */
int
rumpuser_kill(int64_t pid, int sig, int *error)
{

#ifndef __NetBSD__
	/* XXXfixme: signal numbers may not match on non-NetBSD */
	seterror(EOPNOTSUPP);
	return -1;
#else
	if (pid == RUMPUSER_PID_SELF) {
		DOCALL(int, raise(sig));
	} else {
		DOCALL(int, kill((pid_t)pid, sig));
	}
#endif
}
    775   1.4  pooka 
/*
 * Return the number of CPUs on the host, best effort.
 *
 *   NetBSD/FreeBSD/DragonFly: the "hw.ncpu" sysctl
 *   Linux/Cygwin:             number of "processor" lines in
 *                             /proc/cpuinfo
 *   SunOS:                    sysconf(_SC_NPROCESSORS_ONLN)
 *
 * Whenever the query fails or yields a non-positive count (and on
 * any other platform) the answer is 1, so the result is always >= 1.
 */
int
rumpuser_getnhostcpu(void)
{
	int ncpu = 1;

#if defined(__NetBSD__) || defined(__FreeBSD__) || defined(__DragonFly__)
	size_t sz = sizeof(ncpu);

	if (sysctlbyname("hw.ncpu", &ncpu, &sz, NULL, 0) == -1 || ncpu < 1)
		ncpu = 1;
#elif defined(__linux__) || defined(__CYGWIN__)
	FILE *fp;
	char *line = NULL;
	size_t n = 0;

	/* If anyone knows a better way, I'm all ears */
	if ((fp = fopen("/proc/cpuinfo", "r")) != NULL) {
		ncpu = 0;
		while (getline(&line, &n, fp) != -1) {
			if (strncmp(line,
			    "processor", sizeof("processor")-1) == 0)
				ncpu++;
		}
		if (ncpu == 0)
			ncpu = 1;
		free(line);
		fclose(fp);
	}
#elif defined(__sun__)
	long nonline;

	/* XXX: this is just a rough estimate ... */
	nonline = sysconf(_SC_NPROCESSORS_ONLN);
	/* sysconf() reports failure as -1; never hand that out as a count */
	if (nonline > 0)
		ncpu = (int)nonline;
#endif

	return ncpu;
}
    810  1.16    tls 
/*
 * Fill `buf' with `buflen' bytes taken from RUMPUSER_RANDOM().
 *
 * Each RUMPUSER_RANDOM() result is stored in a uint32_t and copied
 * out up to four bytes at a time.  The output is addressed bytewise,
 * so `buf' needs no particular alignment, and the generator is
 * invoked only while bytes are still missing.
 *
 * flags is not used by this implementation.
 *
 * Returns buflen.
 */
size_t
rumpuser_getrandom(void *buf, size_t buflen, int flags)
{
	unsigned char *p = buf;
	size_t remain = buflen;
	size_t chunk;
	uint32_t tmp;

	(void)flags;

	while (remain > 0) {
		/* portable MIN ... */
		chunk = remain < sizeof(tmp) ? remain : sizeof(tmp);
		tmp = RUMPUSER_RANDOM();
		memcpy(p, &tmp, chunk);
		p += chunk;
		remain -= chunk;
	}

	return buflen;
}
    829