Home | History | Annotate | Line # | Download | only in librumpuser
rumpuser.c revision 1.15.4.3
      1  1.15.4.3   yamt /*	$NetBSD: rumpuser.c,v 1.15.4.3 2013/01/16 05:32:28 yamt Exp $	*/
      2       1.1  pooka 
      3       1.1  pooka /*
      4       1.1  pooka  * Copyright (c) 2007-2010 Antti Kantee.  All Rights Reserved.
      5       1.1  pooka  *
      6       1.1  pooka  * Redistribution and use in source and binary forms, with or without
      7       1.1  pooka  * modification, are permitted provided that the following conditions
      8       1.1  pooka  * are met:
      9       1.1  pooka  * 1. Redistributions of source code must retain the above copyright
     10       1.1  pooka  *    notice, this list of conditions and the following disclaimer.
     11       1.1  pooka  * 2. Redistributions in binary form must reproduce the above copyright
     12       1.1  pooka  *    notice, this list of conditions and the following disclaimer in the
     13       1.1  pooka  *    documentation and/or other materials provided with the distribution.
     14       1.1  pooka  *
     15       1.1  pooka  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS
     16       1.1  pooka  * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
     17       1.1  pooka  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
     18       1.1  pooka  * DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
     19       1.1  pooka  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     20       1.1  pooka  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
     21       1.1  pooka  * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     22       1.1  pooka  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     23       1.1  pooka  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     24       1.1  pooka  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     25       1.1  pooka  * SUCH DAMAGE.
     26       1.1  pooka  */
     27       1.1  pooka 
     28  1.15.4.2   yamt #include "rumpuser_port.h"
     29  1.15.4.2   yamt 
     30       1.1  pooka #if !defined(lint)
     31  1.15.4.3   yamt __RCSID("$NetBSD: rumpuser.c,v 1.15.4.3 2013/01/16 05:32:28 yamt Exp $");
     32       1.1  pooka #endif /* !lint */
     33       1.1  pooka 
     34       1.1  pooka #include <sys/ioctl.h>
     35       1.1  pooka #include <sys/mman.h>
     36       1.1  pooka #include <sys/uio.h>
     37  1.15.4.2   yamt #include <sys/stat.h>
     38  1.15.4.2   yamt #include <sys/time.h>
     39       1.1  pooka 
     40       1.1  pooka #ifdef __NetBSD__
     41      1.15  pooka #include <sys/disk.h>
     42       1.1  pooka #include <sys/disklabel.h>
     43      1.15  pooka #include <sys/dkio.h>
     44       1.4  pooka #include <sys/sysctl.h>
     45  1.15.4.2   yamt #include <sys/event.h>
     46       1.1  pooka #endif
     47       1.1  pooka 
     48       1.1  pooka #include <assert.h>
     49       1.1  pooka #include <errno.h>
     50       1.1  pooka #include <fcntl.h>
     51  1.15.4.3   yamt #include <netdb.h>
     52       1.1  pooka #include <poll.h>
     53       1.2  pooka #include <signal.h>
     54       1.1  pooka #include <stdarg.h>
     55       1.1  pooka #include <stdint.h>
     56       1.1  pooka #include <stdio.h>
     57       1.1  pooka #include <stdlib.h>
     58       1.1  pooka #include <string.h>
     59       1.1  pooka #include <time.h>
     60       1.1  pooka #include <unistd.h>
     61       1.1  pooka 
     62       1.1  pooka #include <rump/rumpuser.h>
     63       1.1  pooka 
     64       1.1  pooka #include "rumpuser_int.h"
     65       1.1  pooka 
     66       1.1  pooka int
     67  1.15.4.2   yamt rumpuser_getversion(void)
     68       1.8  pooka {
     69       1.8  pooka 
     70       1.8  pooka 	return RUMPUSER_VERSION;
     71       1.8  pooka }
     72       1.8  pooka 
     73       1.8  pooka int
     74       1.1  pooka rumpuser_getfileinfo(const char *path, uint64_t *sizep, int *ftp, int *error)
     75       1.1  pooka {
     76       1.1  pooka 	struct stat sb;
     77       1.1  pooka 	uint64_t size;
     78       1.1  pooka 	int needsdev = 0, rv = 0, ft;
     79      1.12  pooka 	int fd = -1;
     80       1.1  pooka 
     81       1.1  pooka 	if (stat(path, &sb) == -1) {
     82      1.10  pooka 		seterror(errno);
     83       1.1  pooka 		return -1;
     84       1.1  pooka 	}
     85       1.1  pooka 
     86       1.1  pooka 	switch (sb.st_mode & S_IFMT) {
     87       1.1  pooka 	case S_IFDIR:
     88       1.1  pooka 		ft = RUMPUSER_FT_DIR;
     89       1.1  pooka 		break;
     90       1.1  pooka 	case S_IFREG:
     91       1.1  pooka 		ft = RUMPUSER_FT_REG;
     92       1.1  pooka 		break;
     93       1.1  pooka 	case S_IFBLK:
     94       1.1  pooka 		ft = RUMPUSER_FT_BLK;
     95       1.1  pooka 		needsdev = 1;
     96       1.1  pooka 		break;
     97       1.1  pooka 	case S_IFCHR:
     98       1.1  pooka 		ft = RUMPUSER_FT_CHR;
     99       1.1  pooka 		needsdev = 1;
    100       1.1  pooka 		break;
    101       1.1  pooka 	default:
    102       1.1  pooka 		ft = RUMPUSER_FT_OTHER;
    103       1.1  pooka 		break;
    104       1.1  pooka 	}
    105       1.1  pooka 
    106       1.1  pooka 	if (!needsdev) {
    107       1.1  pooka 		size = sb.st_size;
    108       1.1  pooka 	} else if (sizep) {
    109       1.1  pooka 		/*
    110       1.1  pooka 		 * Welcome to the jungle.  Of course querying the kernel
    111       1.1  pooka 		 * for a device partition size is supposed to be far from
    112       1.1  pooka 		 * trivial.  On NetBSD we use ioctl.  On $other platform
    113       1.1  pooka 		 * we have a problem.  We try "the lseek trick" and just
    114       1.1  pooka 		 * fail if that fails.  Platform specific code can later
    115       1.1  pooka 		 * be written here if appropriate.
    116       1.1  pooka 		 *
    117       1.1  pooka 		 * On NetBSD we hope and pray that for block devices nobody
    118       1.1  pooka 		 * else is holding them open, because otherwise the kernel
    119       1.1  pooka 		 * will not permit us to open it.  Thankfully, this is
    120       1.1  pooka 		 * usually called only in bootstrap and then we can
    121       1.1  pooka 		 * forget about it.
    122       1.1  pooka 		 */
    123       1.1  pooka #ifndef __NetBSD__
    124       1.1  pooka 		off_t off;
    125       1.1  pooka 
    126       1.1  pooka 		fd = open(path, O_RDONLY);
    127       1.1  pooka 		if (fd == -1) {
    128      1.10  pooka 			seterror(errno);
    129       1.1  pooka 			rv = -1;
    130       1.1  pooka 			goto out;
    131       1.1  pooka 		}
    132       1.1  pooka 
    133       1.1  pooka 		off = lseek(fd, 0, SEEK_END);
    134       1.1  pooka 		if (off != 0) {
    135       1.1  pooka 			size = off;
    136       1.1  pooka 			goto out;
    137       1.1  pooka 		}
    138       1.1  pooka 		fprintf(stderr, "error: device size query not implemented on "
    139       1.1  pooka 		    "this platform\n");
    140      1.12  pooka 		seterror(EOPNOTSUPP);
    141       1.1  pooka 		rv = -1;
    142       1.1  pooka 		goto out;
    143       1.1  pooka #else
    144       1.1  pooka 		struct disklabel lab;
    145       1.1  pooka 		struct partition *parta;
    146      1.15  pooka 		struct dkwedge_info dkw;
    147       1.1  pooka 
    148       1.1  pooka 		fd = open(path, O_RDONLY);
    149       1.1  pooka 		if (fd == -1) {
    150      1.10  pooka 			seterror(errno);
    151       1.1  pooka 			rv = -1;
    152       1.1  pooka 			goto out;
    153       1.1  pooka 		}
    154       1.1  pooka 
    155      1.15  pooka 		if (ioctl(fd, DIOCGDINFO, &lab) == 0) {
    156      1.15  pooka 			parta = &lab.d_partitions[DISKPART(sb.st_rdev)];
    157      1.15  pooka 			size = (uint64_t)lab.d_secsize * parta->p_size;
    158      1.15  pooka 			goto out;
    159      1.15  pooka 		}
    160      1.15  pooka 
    161      1.15  pooka 		if (ioctl(fd, DIOCGWEDGEINFO, &dkw) == 0) {
    162      1.15  pooka 			/*
    163      1.15  pooka 			 * XXX: should use DIOCGDISKINFO to query
    164      1.15  pooka 			 * sector size, but that requires proplib,
    165      1.15  pooka 			 * so just don't bother for now.  it's nice
    166      1.15  pooka 			 * that something as difficult as figuring out
    167      1.15  pooka 			 * a partition's size has been made so easy.
    168      1.15  pooka 			 */
    169      1.15  pooka 			size = dkw.dkw_size << DEV_BSHIFT;
    170       1.1  pooka 			goto out;
    171       1.1  pooka 		}
    172       1.1  pooka 
    173      1.15  pooka 		seterror(errno);
    174      1.15  pooka 		rv = -1;
    175       1.1  pooka #endif /* __NetBSD__ */
    176       1.1  pooka 	}
    177       1.1  pooka 
    178       1.1  pooka  out:
    179       1.1  pooka 	if (rv == 0 && sizep)
    180       1.1  pooka 		*sizep = size;
    181       1.1  pooka 	if (rv == 0 && ftp)
    182       1.1  pooka 		*ftp = ft;
    183      1.12  pooka 	if (fd != -1)
    184      1.12  pooka 		close(fd);
    185       1.1  pooka 
    186       1.1  pooka 	return rv;
    187       1.1  pooka }
    188       1.1  pooka 
/*
 * Sleep on the host for the interval given in *sec / *nsec.
 *
 * The host nanosleep() call is issued through KLOCK_WRAP().  On
 * return *sec and *nsec are overwritten with the time that was left
 * to sleep.  nanosleep() only fills in the remaining time when the
 * sleep is interrupted, so the remainder starts out as zero and a
 * completed sleep reports 0/0 instead of stack garbage.
 *
 * Returns the nanosleep() result; on -1 the host errno is reported
 * through seterror().
 */
int
rumpuser_nanosleep(uint64_t *sec, uint64_t *nsec, int *error)
{
	struct timespec rqt, rmt;
	int rv;

	/*LINTED*/
	rqt.tv_sec = *sec;
	/*LINTED*/
	rqt.tv_nsec = *nsec;

	rmt.tv_sec = 0;
	rmt.tv_nsec = 0;

	KLOCK_WRAP(rv = nanosleep(&rqt, &rmt));
	if (rv == -1)
		seterror(errno);

	*sec = rmt.tv_sec;
	*nsec = rmt.tv_nsec;

	return rv;
}
    209       1.1  pooka 
/*
 * Allocate "howmuch" bytes aligned to "alignment" bytes using
 * posix_memalign().  An alignment of 0 selects pointer alignment.
 *
 * Returns the allocation, or NULL if posix_memalign() fails for any
 * reason other than EINVAL.  EINVAL (bad alignment) prints a message
 * and aborts the process.
 */
void *
rumpuser_malloc(size_t howmuch, int alignment)
{
	void *mem = NULL;
	int rv;

	if (alignment == 0)
		alignment = sizeof(void *);

	rv = posix_memalign(&mem, (size_t)alignment, howmuch);
	if (__predict_false(rv == EINVAL)) {
		printf("rumpuser_malloc: invalid alignment %d\n",
		    alignment);
		abort();
	}
	if (__predict_false(rv != 0))
		return NULL;

	return mem;
}
    231       1.1  pooka 
/*
 * Resize the allocation "ptr" to "howmuch" bytes with the host
 * realloc() and hand back whatever it returns.
 */
void *
rumpuser_realloc(void *ptr, size_t howmuch)
{
	void *resized = realloc(ptr, howmuch);

	return resized;
}
    238       1.1  pooka 
/*
 * Release memory with the host free().
 */
void
rumpuser_free(void *ptr)
{
	free(ptr);
}
    245       1.1  pooka 
    246       1.1  pooka void *
    247       1.7  pooka rumpuser_anonmmap(void *prefaddr, size_t size, int alignbit,
    248       1.7  pooka 	int exec, int *error)
    249       1.1  pooka {
    250       1.1  pooka 	void *rv;
    251       1.1  pooka 	int prot;
    252       1.1  pooka 
    253  1.15.4.2   yamt #ifndef MAP_ALIGNED
    254  1.15.4.2   yamt #define MAP_ALIGNED(a) 0
    255  1.15.4.2   yamt 	if (alignbit)
    256  1.15.4.2   yamt 		fprintf(stderr, "rumpuser_anonmmap: warning, requested "
    257  1.15.4.2   yamt 		    "alignment not supported by hypervisor\n");
    258  1.15.4.2   yamt #endif
    259  1.15.4.2   yamt 
    260       1.1  pooka 	prot = PROT_READ|PROT_WRITE;
    261       1.1  pooka 	if (exec)
    262       1.1  pooka 		prot |= PROT_EXEC;
    263       1.7  pooka 	rv = mmap(prefaddr, size, prot,
    264  1.15.4.3   yamt 	    MAP_PRIVATE | MAP_ANON | MAP_ALIGNED(alignbit), -1, 0);
    265       1.1  pooka 	if (rv == MAP_FAILED) {
    266      1.10  pooka 		seterror(errno);
    267       1.1  pooka 		return NULL;
    268       1.1  pooka 	}
    269       1.1  pooka 	return rv;
    270       1.1  pooka }
    271       1.1  pooka 
/*
 * Remove the mapping [addr, addr+len) with munmap().  Failure is
 * only caught by the assertion.
 */
void
rumpuser_unmap(void *addr, size_t len)
{
	const int rv = munmap(addr, len);

	assert(rv == 0);
}
    280       1.1  pooka 
    281       1.1  pooka void *
    282       1.1  pooka rumpuser_filemmap(int fd, off_t offset, size_t len, int flags, int *error)
    283       1.1  pooka {
    284       1.1  pooka 	void *rv;
    285       1.1  pooka 	int mmflags, prot;
    286       1.1  pooka 
    287  1.15.4.3   yamt 	if (flags & RUMPUSER_FILEMMAP_TRUNCATE) {
    288  1.15.4.3   yamt 		if (ftruncate(fd, offset + len) == -1) {
    289  1.15.4.3   yamt 			seterror(errno);
    290  1.15.4.3   yamt 			return NULL;
    291  1.15.4.3   yamt 		}
    292  1.15.4.3   yamt 	}
    293  1.15.4.3   yamt 
    294  1.15.4.3   yamt /* it's implicit */
    295  1.15.4.3   yamt #if defined(__sun__) && !defined(MAP_FILE)
    296  1.15.4.3   yamt #define MAP_FILE 0
    297  1.15.4.3   yamt #endif
    298       1.1  pooka 
    299       1.1  pooka 	mmflags = MAP_FILE;
    300       1.1  pooka 	if (flags & RUMPUSER_FILEMMAP_SHARED)
    301       1.1  pooka 		mmflags |= MAP_SHARED;
    302       1.1  pooka 	else
    303       1.1  pooka 		mmflags |= MAP_PRIVATE;
    304       1.1  pooka 
    305       1.1  pooka 	prot = 0;
    306       1.1  pooka 	if (flags & RUMPUSER_FILEMMAP_READ)
    307       1.1  pooka 		prot |= PROT_READ;
    308       1.1  pooka 	if (flags & RUMPUSER_FILEMMAP_WRITE)
    309       1.1  pooka 		prot |= PROT_WRITE;
    310       1.1  pooka 
    311       1.1  pooka 	rv = mmap(NULL, len, PROT_READ|PROT_WRITE, mmflags, fd, offset);
    312       1.1  pooka 	if (rv == MAP_FAILED) {
    313      1.10  pooka 		seterror(errno);
    314       1.1  pooka 		return NULL;
    315       1.1  pooka 	}
    316       1.1  pooka 
    317      1.10  pooka 	seterror(0);
    318       1.1  pooka 	return rv;
    319       1.1  pooka }
    320       1.1  pooka 
    321       1.1  pooka int
    322       1.1  pooka rumpuser_memsync(void *addr, size_t len, int *error)
    323       1.1  pooka {
    324       1.1  pooka 
    325       1.1  pooka 	DOCALL_KLOCK(int, (msync(addr, len, MS_SYNC)));
    326       1.1  pooka }
    327       1.1  pooka 
    328       1.1  pooka int
    329  1.15.4.2   yamt rumpuser_open(const char *path, int ruflags, int *error)
    330       1.1  pooka {
    331  1.15.4.2   yamt 	int flags;
    332  1.15.4.2   yamt 
    333  1.15.4.2   yamt 	switch (ruflags & RUMPUSER_OPEN_ACCMODE) {
    334  1.15.4.2   yamt 	case RUMPUSER_OPEN_RDONLY:
    335  1.15.4.2   yamt 		flags = O_RDONLY;
    336  1.15.4.2   yamt 		break;
    337  1.15.4.2   yamt 	case RUMPUSER_OPEN_WRONLY:
    338  1.15.4.2   yamt 		flags = O_WRONLY;
    339  1.15.4.2   yamt 		break;
    340  1.15.4.2   yamt 	case RUMPUSER_OPEN_RDWR:
    341  1.15.4.2   yamt 		flags = O_RDWR;
    342  1.15.4.2   yamt 		break;
    343  1.15.4.2   yamt 	default:
    344  1.15.4.2   yamt 		*error = EINVAL;
    345  1.15.4.2   yamt 		return -1;
    346  1.15.4.2   yamt 	}
    347  1.15.4.2   yamt 
    348  1.15.4.2   yamt #define TESTSET(_ru_, _h_) if (ruflags & _ru_) flags |= _h_;
    349  1.15.4.2   yamt 	TESTSET(RUMPUSER_OPEN_CREATE, O_CREAT);
    350  1.15.4.2   yamt 	TESTSET(RUMPUSER_OPEN_EXCL, O_EXCL);
    351  1.15.4.3   yamt #ifdef O_DIRECT
    352  1.15.4.2   yamt 	TESTSET(RUMPUSER_OPEN_DIRECT, O_DIRECT);
    353  1.15.4.3   yamt #else
    354  1.15.4.3   yamt 	if (ruflags & RUMPUSER_OPEN_DIRECT) {
    355  1.15.4.3   yamt 		*error = EOPNOTSUPP;
    356  1.15.4.3   yamt 		return -1;
    357  1.15.4.3   yamt 	}
    358  1.15.4.3   yamt #endif
    359  1.15.4.2   yamt #undef TESTSET
    360       1.1  pooka 
    361  1.15.4.2   yamt 	DOCALL_KLOCK(int, (open(path, flags, 0644)));
    362       1.1  pooka }
    363       1.1  pooka 
    364       1.1  pooka int
    365       1.1  pooka rumpuser_ioctl(int fd, u_long cmd, void *data, int *error)
    366       1.1  pooka {
    367       1.1  pooka 
    368       1.1  pooka 	DOCALL_KLOCK(int, (ioctl(fd, cmd, data)));
    369       1.1  pooka }
    370       1.1  pooka 
    371       1.1  pooka int
    372       1.1  pooka rumpuser_close(int fd, int *error)
    373       1.1  pooka {
    374       1.1  pooka 
    375       1.1  pooka 	DOCALL(int, close(fd));
    376       1.1  pooka }
    377       1.1  pooka 
    378       1.1  pooka int
    379       1.1  pooka rumpuser_fsync(int fd, int *error)
    380       1.1  pooka {
    381       1.1  pooka 
    382       1.1  pooka 	DOCALL_KLOCK(int, fsync(fd));
    383       1.1  pooka }
    384       1.1  pooka 
/*
 * read() up to "size" bytes from host descriptor "fd" into "data".
 * The call is made inside KLOCK_WRAP().
 *
 * Returns the read() result; on -1 the host errno is reported
 * through seterror().
 */
ssize_t
rumpuser_read(int fd, void *data, size_t size, int *error)
{
	ssize_t nread;

	KLOCK_WRAP(nread = read(fd, data, size));
	if (nread == -1) {
		seterror(errno);
	}

	return nread;
}
    396       1.1  pooka 
/*
 * pread() up to "size" bytes at "offset" from host descriptor "fd"
 * into "data".  The call is made inside KLOCK_WRAP().
 *
 * Returns the pread() result; on -1 the host errno is reported
 * through seterror().
 */
ssize_t
rumpuser_pread(int fd, void *data, size_t size, off_t offset, int *error)
{
	ssize_t nread;

	KLOCK_WRAP(nread = pread(fd, data, size, offset));
	if (nread == -1) {
		seterror(errno);
	}

	return nread;
}
    408       1.1  pooka 
    409       1.1  pooka void
    410       1.1  pooka rumpuser_read_bio(int fd, void *data, size_t size, off_t offset,
    411       1.1  pooka 	rump_biodone_fn biodone, void *biodonecookie)
    412       1.1  pooka {
    413       1.1  pooka 	ssize_t rv;
    414       1.1  pooka 	int error = 0;
    415       1.1  pooka 
    416       1.1  pooka 	rv = rumpuser_pread(fd, data, size, offset, &error);
    417       1.1  pooka 	/* check against <0 instead of ==-1 to get typing below right */
    418       1.1  pooka 	if (rv < 0)
    419       1.1  pooka 		rv = 0;
    420       1.1  pooka 
    421       1.1  pooka 	/* LINTED: see above */
    422       1.1  pooka 	biodone(biodonecookie, rv, error);
    423       1.1  pooka }
    424       1.1  pooka 
/*
 * write() "size" bytes from "data" to host descriptor "fd".
 * The call is made inside KLOCK_WRAP().
 *
 * Returns the write() result; on -1 the host errno is reported
 * through seterror().
 */
ssize_t
rumpuser_write(int fd, const void *data, size_t size, int *error)
{
	ssize_t nwritten;

	KLOCK_WRAP(nwritten = write(fd, data, size));
	if (nwritten == -1) {
		seterror(errno);
	}

	return nwritten;
}
    436       1.1  pooka 
/*
 * pwrite() "size" bytes from "data" at "offset" to host descriptor
 * "fd".  The call is made inside KLOCK_WRAP().
 *
 * Returns the pwrite() result; on -1 the host errno is reported
 * through seterror().
 */
ssize_t
rumpuser_pwrite(int fd, const void *data, size_t size, off_t offset, int *error)
{
	ssize_t nwritten;

	KLOCK_WRAP(nwritten = pwrite(fd, data, size, offset));
	if (nwritten == -1) {
		seterror(errno);
	}

	return nwritten;
}
    448       1.1  pooka 
    449       1.1  pooka void
    450       1.1  pooka rumpuser_write_bio(int fd, const void *data, size_t size, off_t offset,
    451       1.1  pooka 	rump_biodone_fn biodone, void *biodonecookie)
    452       1.1  pooka {
    453       1.1  pooka 	ssize_t rv;
    454       1.1  pooka 	int error = 0;
    455       1.1  pooka 
    456       1.1  pooka 	rv = rumpuser_pwrite(fd, data, size, offset, &error);
    457       1.1  pooka 	/* check against <0 instead of ==-1 to get typing below right */
    458       1.1  pooka 	if (rv < 0)
    459       1.1  pooka 		rv = 0;
    460       1.1  pooka 
    461       1.1  pooka 	/* LINTED: see above */
    462       1.1  pooka 	biodone(biodonecookie, rv, error);
    463       1.1  pooka }
    464       1.1  pooka 
    465       1.1  pooka ssize_t
    466       1.1  pooka rumpuser_readv(int fd, const struct rumpuser_iovec *riov, int iovcnt,
    467       1.1  pooka 	int *error)
    468       1.1  pooka {
    469       1.1  pooka 	struct iovec *iovp;
    470       1.1  pooka 	ssize_t rv;
    471       1.1  pooka 	int i;
    472       1.1  pooka 
    473       1.1  pooka 	iovp = malloc(iovcnt * sizeof(struct iovec));
    474       1.1  pooka 	if (iovp == NULL) {
    475      1.10  pooka 		seterror(ENOMEM);
    476       1.1  pooka 		return -1;
    477       1.1  pooka 	}
    478       1.1  pooka 	for (i = 0; i < iovcnt; i++) {
    479       1.1  pooka 		iovp[i].iov_base = riov[i].iov_base;
    480       1.1  pooka 		/*LINTED*/
    481       1.1  pooka 		iovp[i].iov_len = riov[i].iov_len;
    482       1.1  pooka 	}
    483       1.1  pooka 
    484       1.1  pooka 	KLOCK_WRAP(rv = readv(fd, iovp, iovcnt));
    485       1.1  pooka 	if (rv == -1)
    486      1.10  pooka 		seterror(errno);
    487       1.1  pooka 	free(iovp);
    488       1.1  pooka 
    489       1.1  pooka 	return rv;
    490       1.1  pooka }
    491       1.1  pooka 
    492       1.1  pooka ssize_t
    493       1.1  pooka rumpuser_writev(int fd, const struct rumpuser_iovec *riov, int iovcnt,
    494       1.1  pooka 	int *error)
    495       1.1  pooka {
    496       1.1  pooka 	struct iovec *iovp;
    497       1.1  pooka 	ssize_t rv;
    498       1.1  pooka 	int i;
    499       1.1  pooka 
    500       1.1  pooka 	iovp = malloc(iovcnt * sizeof(struct iovec));
    501       1.1  pooka 	if (iovp == NULL) {
    502      1.10  pooka 		seterror(ENOMEM);
    503       1.1  pooka 		return -1;
    504       1.1  pooka 	}
    505       1.1  pooka 	for (i = 0; i < iovcnt; i++) {
    506       1.1  pooka 		iovp[i].iov_base = riov[i].iov_base;
    507       1.1  pooka 		/*LINTED*/
    508       1.1  pooka 		iovp[i].iov_len = riov[i].iov_len;
    509       1.1  pooka 	}
    510       1.1  pooka 
    511       1.1  pooka 	KLOCK_WRAP(rv = writev(fd, iovp, iovcnt));
    512       1.1  pooka 	if (rv == -1)
    513      1.10  pooka 		seterror(errno);
    514       1.1  pooka 	free(iovp);
    515       1.1  pooka 
    516       1.1  pooka 	return rv;
    517       1.1  pooka }
    518       1.1  pooka 
    519       1.1  pooka int
    520       1.1  pooka rumpuser_gettime(uint64_t *sec, uint64_t *nsec, int *error)
    521       1.1  pooka {
    522       1.1  pooka 	struct timeval tv;
    523       1.1  pooka 	int rv;
    524       1.1  pooka 
    525       1.1  pooka 	rv = gettimeofday(&tv, NULL);
    526       1.1  pooka 	if (rv == -1) {
    527      1.10  pooka 		seterror(errno);
    528       1.1  pooka 		return rv;
    529       1.1  pooka 	}
    530       1.1  pooka 
    531       1.1  pooka 	*sec = tv.tv_sec;
    532       1.1  pooka 	*nsec = tv.tv_usec * 1000;
    533       1.1  pooka 
    534       1.1  pooka 	return 0;
    535       1.1  pooka }
    536       1.1  pooka 
    537       1.1  pooka int
    538       1.1  pooka rumpuser_getenv(const char *name, char *buf, size_t blen, int *error)
    539       1.1  pooka {
    540       1.1  pooka 
    541       1.1  pooka 	DOCALL(int, getenv_r(name, buf, blen));
    542       1.1  pooka }
    543       1.1  pooka 
/*
 * Produce a host name for the rump kernel in "name" (capacity
 * "namelen").
 *
 * The name is "rump-<pid>.<host name>.rumpdomain", or
 * "rump-<pid>.rumpdomain" when the host name cannot be obtained.
 * snprintf() truncates the result to fit.
 *
 * Always returns 0 and stores 0 in *error.
 */
int
rumpuser_gethostname(char *name, size_t namelen, int *error)
{
	char tmp[MAXHOSTNAMELEN];

	if (gethostname(tmp, sizeof(tmp)) == -1) {
		snprintf(name, namelen, "rump-%05d.rumpdomain", (int)getpid());
	} else {
		/*
		 * gethostname() is not required to NUL-terminate a
		 * truncated name, so terminate it before using %s.
		 */
		tmp[sizeof(tmp) - 1] = '\0';
		snprintf(name, namelen, "rump-%05d.%s.rumpdomain",
		    (int)getpid(), tmp);
	}

	*error = 0;
	return 0;
}
    559       1.1  pooka 
    560       1.1  pooka int
    561       1.1  pooka rumpuser_poll(struct pollfd *fds, int nfds, int timeout, int *error)
    562       1.1  pooka {
    563       1.1  pooka 
    564       1.1  pooka 	DOCALL_KLOCK(int, (poll(fds, (nfds_t)nfds, timeout)));
    565       1.1  pooka }
    566       1.1  pooka 
    567       1.1  pooka int
    568       1.1  pooka rumpuser_putchar(int c, int *error)
    569       1.1  pooka {
    570       1.1  pooka 
    571       1.1  pooka 	DOCALL(int, (putchar(c)));
    572       1.1  pooka }
    573       1.1  pooka 
    574       1.1  pooka void
    575       1.1  pooka rumpuser_exit(int rv)
    576       1.1  pooka {
    577       1.1  pooka 
    578       1.1  pooka 	if (rv == RUMPUSER_PANIC)
    579       1.1  pooka 		abort();
    580       1.1  pooka 	else
    581       1.1  pooka 		exit(rv);
    582       1.1  pooka }
    583       1.1  pooka 
/*
 * Store "error" in the host errno of the calling thread.
 */
void
rumpuser_seterrno(int error)
{
	errno = error;
}
    590       1.1  pooka 
    591  1.15.4.2   yamt /*
    592  1.15.4.2   yamt  * On NetBSD we use kqueue, on Linux we use inotify.  The underlying
    593  1.15.4.2   yamt  * interface requirements aren't quite the same, but we have a very
    594  1.15.4.2   yamt  * good chance of doing the fd->path mapping on Linux thanks to dcache,
    595  1.15.4.2   yamt  * so just keep the existing interfaces for now.
    596  1.15.4.2   yamt  */
    597  1.15.4.2   yamt #if defined(__NetBSD__)
    598       1.1  pooka int
    599       1.1  pooka rumpuser_writewatchfile_setup(int kq, int fd, intptr_t opaque, int *error)
    600       1.1  pooka {
    601       1.1  pooka 	struct kevent kev;
    602       1.1  pooka 
    603       1.1  pooka 	if (kq == -1) {
    604       1.1  pooka 		kq = kqueue();
    605       1.1  pooka 		if (kq == -1) {
    606      1.10  pooka 			seterror(errno);
    607       1.1  pooka 			return -1;
    608       1.1  pooka 		}
    609       1.1  pooka 	}
    610       1.1  pooka 
    611       1.1  pooka 	EV_SET(&kev, fd, EVFILT_VNODE, EV_ADD|EV_ENABLE|EV_CLEAR,
    612       1.1  pooka 	    NOTE_WRITE, 0, opaque);
    613       1.1  pooka 	if (kevent(kq, &kev, 1, NULL, 0, NULL) == -1) {
    614      1.10  pooka 		seterror(errno);
    615       1.1  pooka 		return -1;
    616       1.1  pooka 	}
    617       1.1  pooka 
    618       1.1  pooka 	return kq;
    619       1.1  pooka }
    620       1.1  pooka 
    621       1.1  pooka int
    622       1.1  pooka rumpuser_writewatchfile_wait(int kq, intptr_t *opaque, int *error)
    623       1.1  pooka {
    624       1.1  pooka 	struct kevent kev;
    625       1.1  pooka 	int rv;
    626       1.1  pooka 
    627       1.9  pooka  again:
    628       1.1  pooka 	KLOCK_WRAP(rv = kevent(kq, NULL, 0, &kev, 1, NULL));
    629       1.1  pooka 	if (rv == -1) {
    630       1.9  pooka 		if (errno == EINTR)
    631       1.9  pooka 			goto again;
    632      1.10  pooka 		seterror(errno);
    633       1.1  pooka 		return -1;
    634       1.1  pooka 	}
    635       1.1  pooka 
    636       1.1  pooka 	if (opaque)
    637       1.1  pooka 		*opaque = kev.udata;
    638       1.1  pooka 	return rv;
    639       1.1  pooka }
    640       1.1  pooka 
    641  1.15.4.2   yamt #elif defined(__linux__)
    642  1.15.4.2   yamt #include <sys/inotify.h>
    643  1.15.4.2   yamt 
    644  1.15.4.2   yamt int
    645  1.15.4.2   yamt rumpuser_writewatchfile_setup(int inotify, int fd, intptr_t notused, int *error)
    646  1.15.4.2   yamt {
    647  1.15.4.2   yamt 	char procbuf[PATH_MAX], linkbuf[PATH_MAX];
    648  1.15.4.2   yamt 	ssize_t nn;
    649  1.15.4.2   yamt 
    650  1.15.4.2   yamt 	if (inotify == -1) {
    651  1.15.4.2   yamt 		inotify = inotify_init();
    652  1.15.4.2   yamt 		if (inotify == -1) {
    653  1.15.4.2   yamt 			seterror(errno);
    654  1.15.4.2   yamt 			return -1;
    655  1.15.4.2   yamt 		}
    656  1.15.4.2   yamt 	}
    657  1.15.4.2   yamt 
    658  1.15.4.2   yamt 	/* ok, need to map fd into path for inotify */
    659  1.15.4.2   yamt 	snprintf(procbuf, sizeof(procbuf), "/proc/self/fd/%d", fd);
    660  1.15.4.2   yamt 	nn = readlink(procbuf, linkbuf, sizeof(linkbuf));
    661  1.15.4.2   yamt 	if (nn >= (ssize_t)sizeof(linkbuf)) {
    662  1.15.4.2   yamt 		nn = -1;
    663  1.15.4.2   yamt 		errno = E2BIG; /* pick something */
    664  1.15.4.2   yamt 	}
    665  1.15.4.2   yamt 	if (nn == -1) {
    666  1.15.4.2   yamt 		seterror(errno);
    667  1.15.4.2   yamt 		close(inotify);
    668  1.15.4.2   yamt 		return -1;
    669  1.15.4.2   yamt 	}
    670  1.15.4.2   yamt 
    671  1.15.4.2   yamt 	if (inotify_add_watch(inotify, linkbuf, IN_MODIFY) == -1) {
    672  1.15.4.2   yamt 		seterror(errno);
    673  1.15.4.2   yamt 		close(inotify);
    674  1.15.4.2   yamt 		return -1;
    675  1.15.4.2   yamt 	}
    676  1.15.4.2   yamt 
    677  1.15.4.2   yamt 	return inotify;
    678  1.15.4.2   yamt }
    679  1.15.4.2   yamt 
    680  1.15.4.2   yamt int
    681  1.15.4.2   yamt rumpuser_writewatchfile_wait(int kq, intptr_t *opaque, int *error)
    682  1.15.4.2   yamt {
    683  1.15.4.2   yamt 	struct inotify_event iev;
    684  1.15.4.2   yamt 	ssize_t nn;
    685  1.15.4.2   yamt 
    686  1.15.4.2   yamt 	do {
    687  1.15.4.2   yamt 		KLOCK_WRAP(nn = read(kq, &iev, sizeof(iev)));
    688  1.15.4.2   yamt 	} while (errno == EINTR);
    689  1.15.4.2   yamt 
    690  1.15.4.2   yamt 	if (nn == -1) {
    691  1.15.4.2   yamt 		seterror(errno);
    692  1.15.4.2   yamt 		return -1;
    693  1.15.4.2   yamt 	}
    694  1.15.4.2   yamt 	return (nn/sizeof(iev));
    695  1.15.4.2   yamt }
    696  1.15.4.2   yamt #endif
    697  1.15.4.2   yamt 
/*
 * This is meant for safe debugging prints from the kernel:
 * printf-style formatting written to the host's stderr.
 *
 * Returns whatever vfprintf() returns.
 */
int
rumpuser_dprintf(const char *format, ...)
{
	va_list args;
	int nprinted;

	va_start(args, format);
	nprinted = vfprintf(stderr, format, args);
	va_end(args);

	return nprinted;
}
    713       1.2  pooka 
/*
 * Deliver signal "sig" to host process "pid".
 *
 * On NetBSD, RUMPUSER_PID_SELF selects raise(); any other pid goes
 * to kill().  Both are issued through DOCALL(), which is defined
 * outside this file and supplies the return statement.
 *
 * On other hosts the call is refused: -1 is returned and EOPNOTSUPP
 * is reported through seterror().
 */
int
rumpuser_kill(int64_t pid, int sig, int *error)
{

#ifdef __NetBSD__
	if (pid != RUMPUSER_PID_SELF) {
		DOCALL(int, kill((pid_t)pid, sig));
	} else {
		DOCALL(int, raise(sig));
	}
#else
	/* XXXfixme: signal numbers may not match on non-NetBSD */
	seterror(EOPNOTSUPP);
	return -1;
#endif
}
    730       1.4  pooka 
/*
 * Return the number of CPUs on the host.
 *
 * NetBSD:  the hw.ncpu sysctl.
 * Linux:   count of lines starting with "processor" in /proc/cpuinfo.
 * Solaris: sysconf(_SC_NPROCESSORS_ONLN).
 *
 * The result is never less than 1: if the query fails, yields a
 * non-positive value, or the platform is not covered, 1 is returned.
 */
int
rumpuser_getnhostcpu(void)
{
	int ncpu = 1;

#ifdef __NetBSD__
	size_t sz = sizeof(ncpu);

	/* a failed or nonsensical query falls back to one CPU */
	if (sysctlbyname("hw.ncpu", &ncpu, &sz, NULL, 0) == -1 || ncpu < 1)
		ncpu = 1;
#elif __linux__
	FILE *fp;
	char *line = NULL;
	size_t n = 0;

	/* If anyone knows a better way, I'm all ears */
	if ((fp = fopen("/proc/cpuinfo", "r")) != NULL) {
		ncpu = 0;
		while (getline(&line, &n, fp) != -1) {
			if (strncmp(line,
			    "processor", sizeof("processor")-1) == 0)
				ncpu++;
		}
		if (ncpu == 0)
			ncpu = 1;
		free(line);
		fclose(fp);
	}
#elif __sun__
	/* XXX: this is just a rough estimate ... */
	long nonline = sysconf(_SC_NPROCESSORS_ONLN);

	/* sysconf() returns -1 on failure; keep the default then */
	if (nonline > 0)
		ncpu = (int)nonline;
#endif

	return ncpu;
}
    765  1.15.4.1   yamt 
/*
 * Return a 32-bit random value from the host's arc4random().
 *
 * XXX: this hypercall needs a better name
 */
uint32_t
rumpuser_arc4random(void)
{
	const uint32_t value = arc4random();

	return value;
}
    773