Home | History | Annotate | Line # | Download | only in librumpuser
rumpuser.c revision 1.23
      1  1.23  pooka /*	$NetBSD: rumpuser.c,v 1.23 2012/11/18 19:29:40 pooka Exp $	*/
      2   1.1  pooka 
      3   1.1  pooka /*
      4   1.1  pooka  * Copyright (c) 2007-2010 Antti Kantee.  All Rights Reserved.
      5   1.1  pooka  *
      6   1.1  pooka  * Redistribution and use in source and binary forms, with or without
      7   1.1  pooka  * modification, are permitted provided that the following conditions
      8   1.1  pooka  * are met:
      9   1.1  pooka  * 1. Redistributions of source code must retain the above copyright
     10   1.1  pooka  *    notice, this list of conditions and the following disclaimer.
     11   1.1  pooka  * 2. Redistributions in binary form must reproduce the above copyright
     12   1.1  pooka  *    notice, this list of conditions and the following disclaimer in the
     13   1.1  pooka  *    documentation and/or other materials provided with the distribution.
     14   1.1  pooka  *
     15   1.1  pooka  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS
     16   1.1  pooka  * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
     17   1.1  pooka  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
     18   1.1  pooka  * DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
     19   1.1  pooka  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     20   1.1  pooka  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
     21   1.1  pooka  * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     22   1.1  pooka  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     23   1.1  pooka  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     24   1.1  pooka  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     25   1.1  pooka  * SUCH DAMAGE.
     26   1.1  pooka  */
     27   1.1  pooka 
     28  1.18  pooka #include "rumpuser_port.h"
     29  1.18  pooka 
     30   1.1  pooka #if !defined(lint)
     31  1.23  pooka __RCSID("$NetBSD: rumpuser.c,v 1.23 2012/11/18 19:29:40 pooka Exp $");
     32   1.1  pooka #endif /* !lint */
     33   1.1  pooka 
     34   1.1  pooka #include <sys/ioctl.h>
     35   1.1  pooka #include <sys/mman.h>
     36   1.1  pooka #include <sys/uio.h>
     37  1.18  pooka #include <sys/stat.h>
     38  1.18  pooka #include <sys/time.h>
     39   1.1  pooka 
     40   1.1  pooka #ifdef __NetBSD__
     41  1.15  pooka #include <sys/disk.h>
     42   1.1  pooka #include <sys/disklabel.h>
     43  1.15  pooka #include <sys/dkio.h>
     44   1.4  pooka #include <sys/sysctl.h>
     45  1.18  pooka #include <sys/event.h>
     46   1.1  pooka #endif
     47   1.1  pooka 
     48   1.1  pooka #include <assert.h>
     49   1.1  pooka #include <errno.h>
     50   1.1  pooka #include <fcntl.h>
     51  1.23  pooka #include <netdb.h>
     52   1.1  pooka #include <poll.h>
     53   1.2  pooka #include <signal.h>
     54   1.1  pooka #include <stdarg.h>
     55   1.1  pooka #include <stdint.h>
     56   1.1  pooka #include <stdio.h>
     57   1.1  pooka #include <stdlib.h>
     58   1.1  pooka #include <string.h>
     59   1.1  pooka #include <time.h>
     60   1.1  pooka #include <unistd.h>
     61   1.1  pooka 
     62   1.1  pooka #include <rump/rumpuser.h>
     63   1.1  pooka 
     64   1.1  pooka #include "rumpuser_int.h"
     65   1.1  pooka 
     66   1.1  pooka int
     67  1.17    abs rumpuser_getversion(void)
     68   1.8  pooka {
     69   1.8  pooka 
     70   1.8  pooka 	return RUMPUSER_VERSION;
     71   1.8  pooka }
     72   1.8  pooka 
     73   1.8  pooka int
     74   1.1  pooka rumpuser_getfileinfo(const char *path, uint64_t *sizep, int *ftp, int *error)
     75   1.1  pooka {
     76   1.1  pooka 	struct stat sb;
     77   1.1  pooka 	uint64_t size;
     78   1.1  pooka 	int needsdev = 0, rv = 0, ft;
     79  1.12  pooka 	int fd = -1;
     80   1.1  pooka 
     81   1.1  pooka 	if (stat(path, &sb) == -1) {
     82  1.10  pooka 		seterror(errno);
     83   1.1  pooka 		return -1;
     84   1.1  pooka 	}
     85   1.1  pooka 
     86   1.1  pooka 	switch (sb.st_mode & S_IFMT) {
     87   1.1  pooka 	case S_IFDIR:
     88   1.1  pooka 		ft = RUMPUSER_FT_DIR;
     89   1.1  pooka 		break;
     90   1.1  pooka 	case S_IFREG:
     91   1.1  pooka 		ft = RUMPUSER_FT_REG;
     92   1.1  pooka 		break;
     93   1.1  pooka 	case S_IFBLK:
     94   1.1  pooka 		ft = RUMPUSER_FT_BLK;
     95   1.1  pooka 		needsdev = 1;
     96   1.1  pooka 		break;
     97   1.1  pooka 	case S_IFCHR:
     98   1.1  pooka 		ft = RUMPUSER_FT_CHR;
     99   1.1  pooka 		needsdev = 1;
    100   1.1  pooka 		break;
    101   1.1  pooka 	default:
    102   1.1  pooka 		ft = RUMPUSER_FT_OTHER;
    103   1.1  pooka 		break;
    104   1.1  pooka 	}
    105   1.1  pooka 
    106   1.1  pooka 	if (!needsdev) {
    107   1.1  pooka 		size = sb.st_size;
    108   1.1  pooka 	} else if (sizep) {
    109   1.1  pooka 		/*
    110   1.1  pooka 		 * Welcome to the jungle.  Of course querying the kernel
    111   1.1  pooka 		 * for a device partition size is supposed to be far from
    112   1.1  pooka 		 * trivial.  On NetBSD we use ioctl.  On $other platform
    113   1.1  pooka 		 * we have a problem.  We try "the lseek trick" and just
    114   1.1  pooka 		 * fail if that fails.  Platform specific code can later
    115   1.1  pooka 		 * be written here if appropriate.
    116   1.1  pooka 		 *
    117   1.1  pooka 		 * On NetBSD we hope and pray that for block devices nobody
    118   1.1  pooka 		 * else is holding them open, because otherwise the kernel
    119   1.1  pooka 		 * will not permit us to open it.  Thankfully, this is
    120   1.1  pooka 		 * usually called only in bootstrap and then we can
    121   1.1  pooka 		 * forget about it.
    122   1.1  pooka 		 */
    123   1.1  pooka #ifndef __NetBSD__
    124   1.1  pooka 		off_t off;
    125   1.1  pooka 
    126   1.1  pooka 		fd = open(path, O_RDONLY);
    127   1.1  pooka 		if (fd == -1) {
    128  1.10  pooka 			seterror(errno);
    129   1.1  pooka 			rv = -1;
    130   1.1  pooka 			goto out;
    131   1.1  pooka 		}
    132   1.1  pooka 
    133   1.1  pooka 		off = lseek(fd, 0, SEEK_END);
    134   1.1  pooka 		if (off != 0) {
    135   1.1  pooka 			size = off;
    136   1.1  pooka 			goto out;
    137   1.1  pooka 		}
    138   1.1  pooka 		fprintf(stderr, "error: device size query not implemented on "
    139   1.1  pooka 		    "this platform\n");
    140  1.12  pooka 		seterror(EOPNOTSUPP);
    141   1.1  pooka 		rv = -1;
    142   1.1  pooka 		goto out;
    143   1.1  pooka #else
    144   1.1  pooka 		struct disklabel lab;
    145   1.1  pooka 		struct partition *parta;
    146  1.15  pooka 		struct dkwedge_info dkw;
    147   1.1  pooka 
    148   1.1  pooka 		fd = open(path, O_RDONLY);
    149   1.1  pooka 		if (fd == -1) {
    150  1.10  pooka 			seterror(errno);
    151   1.1  pooka 			rv = -1;
    152   1.1  pooka 			goto out;
    153   1.1  pooka 		}
    154   1.1  pooka 
    155  1.15  pooka 		if (ioctl(fd, DIOCGDINFO, &lab) == 0) {
    156  1.15  pooka 			parta = &lab.d_partitions[DISKPART(sb.st_rdev)];
    157  1.15  pooka 			size = (uint64_t)lab.d_secsize * parta->p_size;
    158  1.15  pooka 			goto out;
    159  1.15  pooka 		}
    160  1.15  pooka 
    161  1.15  pooka 		if (ioctl(fd, DIOCGWEDGEINFO, &dkw) == 0) {
    162  1.15  pooka 			/*
    163  1.15  pooka 			 * XXX: should use DIOCGDISKINFO to query
    164  1.15  pooka 			 * sector size, but that requires proplib,
    165  1.15  pooka 			 * so just don't bother for now.  it's nice
    166  1.15  pooka 			 * that something as difficult as figuring out
    167  1.15  pooka 			 * a partition's size has been made so easy.
    168  1.15  pooka 			 */
    169  1.15  pooka 			size = dkw.dkw_size << DEV_BSHIFT;
    170   1.1  pooka 			goto out;
    171   1.1  pooka 		}
    172   1.1  pooka 
    173  1.15  pooka 		seterror(errno);
    174  1.15  pooka 		rv = -1;
    175   1.1  pooka #endif /* __NetBSD__ */
    176   1.1  pooka 	}
    177   1.1  pooka 
    178   1.1  pooka  out:
    179   1.1  pooka 	if (rv == 0 && sizep)
    180   1.1  pooka 		*sizep = size;
    181   1.1  pooka 	if (rv == 0 && ftp)
    182   1.1  pooka 		*ftp = ft;
    183  1.12  pooka 	if (fd != -1)
    184  1.12  pooka 		close(fd);
    185   1.1  pooka 
    186   1.1  pooka 	return rv;
    187   1.1  pooka }
    188   1.1  pooka 
/*
 * Sleep for the interval given by *sec and *nsec.
 *
 * sec, nsec: in: requested sleep time; out: the unslept remainder
 * error:     error slot filled in through seterror() on failure
 *
 * Returns the nanosleep() result (0 or -1).
 */
int
rumpuser_nanosleep(uint64_t *sec, uint64_t *nsec, int *error)
{
	struct timespec rqt, rmt;
	int rv;

	/*LINTED*/
	rqt.tv_sec = *sec;
	/*LINTED*/
	rqt.tv_nsec = *nsec;

	/*
	 * nanosleep() fills in the remainder only when it is interrupted.
	 * Start from zero so that the values copied out below are defined
	 * for a completed sleep and for other failures too.
	 */
	rmt.tv_sec = 0;
	rmt.tv_nsec = 0;

	KLOCK_WRAP(rv = nanosleep(&rqt, &rmt));
	if (rv == -1)
		seterror(errno);

	*sec = rmt.tv_sec;
	*nsec = rmt.tv_nsec;

	return rv;
}
    209   1.1  pooka 
/*
 * Allocate "howmuch" bytes aligned to "alignment" with posix_memalign().
 * An alignment of 0 selects sizeof(void *).  Returns NULL if the
 * allocation fails; an alignment rejected with EINVAL is reported on
 * stdout and aborts the process.
 */
void *
rumpuser_malloc(size_t howmuch, int alignment)
{
	void *mem;
	int align, rv;

	align = alignment != 0 ? alignment : (int)sizeof(void *);

	rv = posix_memalign(&mem, (size_t)align, howmuch);
	if (__predict_false(rv != 0)) {
		if (rv != EINVAL)
			return NULL;

		printf("rumpuser_malloc: invalid alignment %d\n", align);
		abort();
	}

	return mem;
}
    231   1.1  pooka 
/*
 * Resize the allocation at "ptr" to "howmuch" bytes; a plain
 * pass-through to realloc().
 */
void *
rumpuser_realloc(void *ptr, size_t howmuch)
{
	void *resized = realloc(ptr, howmuch);

	return resized;
}
    238   1.1  pooka 
/*
 * Release memory at "ptr"; a plain pass-through to free().
 */
void
rumpuser_free(void *ptr)
{
	free(ptr);
}
    245   1.1  pooka 
    246   1.1  pooka void *
    247   1.7  pooka rumpuser_anonmmap(void *prefaddr, size_t size, int alignbit,
    248   1.7  pooka 	int exec, int *error)
    249   1.1  pooka {
    250   1.1  pooka 	void *rv;
    251   1.1  pooka 	int prot;
    252   1.1  pooka 
    253  1.18  pooka #ifndef MAP_ALIGNED
    254  1.18  pooka #define MAP_ALIGNED(a) 0
    255  1.18  pooka 	if (alignbit)
    256  1.18  pooka 		fprintf(stderr, "rumpuser_anonmmap: warning, requested "
    257  1.18  pooka 		    "alignment not supported by hypervisor\n");
    258  1.18  pooka #endif
    259  1.18  pooka 
    260   1.1  pooka 	prot = PROT_READ|PROT_WRITE;
    261   1.1  pooka 	if (exec)
    262   1.1  pooka 		prot |= PROT_EXEC;
    263   1.7  pooka 	rv = mmap(prefaddr, size, prot,
    264   1.7  pooka 	    MAP_ANON | MAP_ALIGNED(alignbit), -1, 0);
    265   1.1  pooka 	if (rv == MAP_FAILED) {
    266  1.10  pooka 		seterror(errno);
    267   1.1  pooka 		return NULL;
    268   1.1  pooka 	}
    269   1.1  pooka 	return rv;
    270   1.1  pooka }
    271   1.1  pooka 
/*
 * Unmap "len" bytes starting at "addr".  A munmap() failure trips
 * the assertion (when assertions are compiled in).
 */
void
rumpuser_unmap(void *addr, size_t len)
{
	int rv = munmap(addr, len);

	assert(rv == 0);
}
    280   1.1  pooka 
    281   1.1  pooka void *
    282   1.1  pooka rumpuser_filemmap(int fd, off_t offset, size_t len, int flags, int *error)
    283   1.1  pooka {
    284   1.1  pooka 	void *rv;
    285   1.1  pooka 	int mmflags, prot;
    286   1.1  pooka 
    287  1.22  pooka 	if (flags & RUMPUSER_FILEMMAP_TRUNCATE) {
    288  1.22  pooka 		if (ftruncate(fd, offset + len) == -1) {
    289  1.22  pooka 			seterror(errno);
    290  1.22  pooka 			return NULL;
    291  1.22  pooka 		}
    292  1.22  pooka 	}
    293   1.1  pooka 
    294  1.23  pooka /* it's implicit */
    295  1.23  pooka #if defined(__sun__) && !defined(MAP_FILE)
    296  1.23  pooka #define MAP_FILE 0
    297  1.23  pooka #endif
    298  1.23  pooka 
    299   1.1  pooka 	mmflags = MAP_FILE;
    300   1.1  pooka 	if (flags & RUMPUSER_FILEMMAP_SHARED)
    301   1.1  pooka 		mmflags |= MAP_SHARED;
    302   1.1  pooka 	else
    303   1.1  pooka 		mmflags |= MAP_PRIVATE;
    304   1.1  pooka 
    305   1.1  pooka 	prot = 0;
    306   1.1  pooka 	if (flags & RUMPUSER_FILEMMAP_READ)
    307   1.1  pooka 		prot |= PROT_READ;
    308   1.1  pooka 	if (flags & RUMPUSER_FILEMMAP_WRITE)
    309   1.1  pooka 		prot |= PROT_WRITE;
    310   1.1  pooka 
    311   1.1  pooka 	rv = mmap(NULL, len, PROT_READ|PROT_WRITE, mmflags, fd, offset);
    312   1.1  pooka 	if (rv == MAP_FAILED) {
    313  1.10  pooka 		seterror(errno);
    314   1.1  pooka 		return NULL;
    315   1.1  pooka 	}
    316   1.1  pooka 
    317  1.10  pooka 	seterror(0);
    318   1.1  pooka 	return rv;
    319   1.1  pooka }
    320   1.1  pooka 
    321   1.1  pooka int
    322   1.1  pooka rumpuser_memsync(void *addr, size_t len, int *error)
    323   1.1  pooka {
    324   1.1  pooka 
    325   1.1  pooka 	DOCALL_KLOCK(int, (msync(addr, len, MS_SYNC)));
    326   1.1  pooka }
    327   1.1  pooka 
    328   1.1  pooka int
    329  1.20  pooka rumpuser_open(const char *path, int ruflags, int *error)
    330   1.1  pooka {
    331  1.20  pooka 	int flags;
    332   1.1  pooka 
    333  1.20  pooka 	switch (ruflags & RUMPUSER_OPEN_ACCMODE) {
    334  1.20  pooka 	case RUMPUSER_OPEN_RDONLY:
    335  1.20  pooka 		flags = O_RDONLY;
    336  1.20  pooka 		break;
    337  1.20  pooka 	case RUMPUSER_OPEN_WRONLY:
    338  1.20  pooka 		flags = O_WRONLY;
    339  1.20  pooka 		break;
    340  1.20  pooka 	case RUMPUSER_OPEN_RDWR:
    341  1.20  pooka 		flags = O_RDWR;
    342  1.20  pooka 		break;
    343  1.20  pooka 	default:
    344  1.20  pooka 		*error = EINVAL;
    345  1.20  pooka 		return -1;
    346  1.20  pooka 	}
    347  1.20  pooka 
    348  1.20  pooka #define TESTSET(_ru_, _h_) if (ruflags & _ru_) flags |= _h_;
    349  1.20  pooka 	TESTSET(RUMPUSER_OPEN_CREATE, O_CREAT);
    350  1.20  pooka 	TESTSET(RUMPUSER_OPEN_EXCL, O_EXCL);
    351  1.23  pooka #ifdef O_DIRECT
    352  1.20  pooka 	TESTSET(RUMPUSER_OPEN_DIRECT, O_DIRECT);
    353  1.23  pooka #else
    354  1.23  pooka 	if (ruflags & RUMPUSER_OPEN_DIRECT) {
    355  1.23  pooka 		*error = EOPNOTSUPP;
    356  1.23  pooka 		return -1;
    357  1.23  pooka 	}
    358  1.23  pooka #endif
    359  1.20  pooka #undef TESTSET
    360  1.20  pooka 
    361  1.20  pooka 	DOCALL_KLOCK(int, (open(path, flags, 0644)));
    362   1.1  pooka }
    363   1.1  pooka 
    364   1.1  pooka int
    365   1.1  pooka rumpuser_ioctl(int fd, u_long cmd, void *data, int *error)
    366   1.1  pooka {
    367   1.1  pooka 
    368   1.1  pooka 	DOCALL_KLOCK(int, (ioctl(fd, cmd, data)));
    369   1.1  pooka }
    370   1.1  pooka 
    371   1.1  pooka int
    372   1.1  pooka rumpuser_close(int fd, int *error)
    373   1.1  pooka {
    374   1.1  pooka 
    375   1.1  pooka 	DOCALL(int, close(fd));
    376   1.1  pooka }
    377   1.1  pooka 
    378   1.1  pooka int
    379   1.1  pooka rumpuser_fsync(int fd, int *error)
    380   1.1  pooka {
    381   1.1  pooka 
    382   1.1  pooka 	DOCALL_KLOCK(int, fsync(fd));
    383   1.1  pooka }
    384   1.1  pooka 
/*
 * Read up to "size" bytes from "fd" into "data".  Returns the read()
 * result; on -1 the errno value is stored through seterror().
 */
ssize_t
rumpuser_read(int fd, void *data, size_t size, int *error)
{
	ssize_t nread;

	KLOCK_WRAP(nread = read(fd, data, size));
	if (nread != -1)
		return nread;

	seterror(errno);
	return -1;
}
    396   1.1  pooka 
/*
 * Read up to "size" bytes from "fd" at file position "offset" into
 * "data".  Returns the pread() result; on -1 the errno value is stored
 * through seterror().
 */
ssize_t
rumpuser_pread(int fd, void *data, size_t size, off_t offset, int *error)
{
	ssize_t nread;

	KLOCK_WRAP(nread = pread(fd, data, size, offset));
	if (nread != -1)
		return nread;

	seterror(errno);
	return -1;
}
    408   1.1  pooka 
    409   1.1  pooka void
    410   1.1  pooka rumpuser_read_bio(int fd, void *data, size_t size, off_t offset,
    411   1.1  pooka 	rump_biodone_fn biodone, void *biodonecookie)
    412   1.1  pooka {
    413   1.1  pooka 	ssize_t rv;
    414   1.1  pooka 	int error = 0;
    415   1.1  pooka 
    416   1.1  pooka 	rv = rumpuser_pread(fd, data, size, offset, &error);
    417   1.1  pooka 	/* check against <0 instead of ==-1 to get typing below right */
    418   1.1  pooka 	if (rv < 0)
    419   1.1  pooka 		rv = 0;
    420   1.1  pooka 
    421   1.1  pooka 	/* LINTED: see above */
    422   1.1  pooka 	biodone(biodonecookie, rv, error);
    423   1.1  pooka }
    424   1.1  pooka 
/*
 * Write "size" bytes from "data" to "fd".  Returns the write() result;
 * on -1 the errno value is stored through seterror().
 */
ssize_t
rumpuser_write(int fd, const void *data, size_t size, int *error)
{
	ssize_t nwritten;

	KLOCK_WRAP(nwritten = write(fd, data, size));
	if (nwritten != -1)
		return nwritten;

	seterror(errno);
	return -1;
}
    436   1.1  pooka 
/*
 * Write "size" bytes from "data" to "fd" at file position "offset".
 * Returns the pwrite() result; on -1 the errno value is stored through
 * seterror().
 */
ssize_t
rumpuser_pwrite(int fd, const void *data, size_t size, off_t offset, int *error)
{
	ssize_t nwritten;

	KLOCK_WRAP(nwritten = pwrite(fd, data, size, offset));
	if (nwritten != -1)
		return nwritten;

	seterror(errno);
	return -1;
}
    448   1.1  pooka 
    449   1.1  pooka void
    450   1.1  pooka rumpuser_write_bio(int fd, const void *data, size_t size, off_t offset,
    451   1.1  pooka 	rump_biodone_fn biodone, void *biodonecookie)
    452   1.1  pooka {
    453   1.1  pooka 	ssize_t rv;
    454   1.1  pooka 	int error = 0;
    455   1.1  pooka 
    456   1.1  pooka 	rv = rumpuser_pwrite(fd, data, size, offset, &error);
    457   1.1  pooka 	/* check against <0 instead of ==-1 to get typing below right */
    458   1.1  pooka 	if (rv < 0)
    459   1.1  pooka 		rv = 0;
    460   1.1  pooka 
    461   1.1  pooka 	/* LINTED: see above */
    462   1.1  pooka 	biodone(biodonecookie, rv, error);
    463   1.1  pooka }
    464   1.1  pooka 
    465   1.1  pooka ssize_t
    466   1.1  pooka rumpuser_readv(int fd, const struct rumpuser_iovec *riov, int iovcnt,
    467   1.1  pooka 	int *error)
    468   1.1  pooka {
    469   1.1  pooka 	struct iovec *iovp;
    470   1.1  pooka 	ssize_t rv;
    471   1.1  pooka 	int i;
    472   1.1  pooka 
    473   1.1  pooka 	iovp = malloc(iovcnt * sizeof(struct iovec));
    474   1.1  pooka 	if (iovp == NULL) {
    475  1.10  pooka 		seterror(ENOMEM);
    476   1.1  pooka 		return -1;
    477   1.1  pooka 	}
    478   1.1  pooka 	for (i = 0; i < iovcnt; i++) {
    479   1.1  pooka 		iovp[i].iov_base = riov[i].iov_base;
    480   1.1  pooka 		/*LINTED*/
    481   1.1  pooka 		iovp[i].iov_len = riov[i].iov_len;
    482   1.1  pooka 	}
    483   1.1  pooka 
    484   1.1  pooka 	KLOCK_WRAP(rv = readv(fd, iovp, iovcnt));
    485   1.1  pooka 	if (rv == -1)
    486  1.10  pooka 		seterror(errno);
    487   1.1  pooka 	free(iovp);
    488   1.1  pooka 
    489   1.1  pooka 	return rv;
    490   1.1  pooka }
    491   1.1  pooka 
    492   1.1  pooka ssize_t
    493   1.1  pooka rumpuser_writev(int fd, const struct rumpuser_iovec *riov, int iovcnt,
    494   1.1  pooka 	int *error)
    495   1.1  pooka {
    496   1.1  pooka 	struct iovec *iovp;
    497   1.1  pooka 	ssize_t rv;
    498   1.1  pooka 	int i;
    499   1.1  pooka 
    500   1.1  pooka 	iovp = malloc(iovcnt * sizeof(struct iovec));
    501   1.1  pooka 	if (iovp == NULL) {
    502  1.10  pooka 		seterror(ENOMEM);
    503   1.1  pooka 		return -1;
    504   1.1  pooka 	}
    505   1.1  pooka 	for (i = 0; i < iovcnt; i++) {
    506   1.1  pooka 		iovp[i].iov_base = riov[i].iov_base;
    507   1.1  pooka 		/*LINTED*/
    508   1.1  pooka 		iovp[i].iov_len = riov[i].iov_len;
    509   1.1  pooka 	}
    510   1.1  pooka 
    511   1.1  pooka 	KLOCK_WRAP(rv = writev(fd, iovp, iovcnt));
    512   1.1  pooka 	if (rv == -1)
    513  1.10  pooka 		seterror(errno);
    514   1.1  pooka 	free(iovp);
    515   1.1  pooka 
    516   1.1  pooka 	return rv;
    517   1.1  pooka }
    518   1.1  pooka 
    519   1.1  pooka int
    520   1.1  pooka rumpuser_gettime(uint64_t *sec, uint64_t *nsec, int *error)
    521   1.1  pooka {
    522   1.1  pooka 	struct timeval tv;
    523   1.1  pooka 	int rv;
    524   1.1  pooka 
    525   1.1  pooka 	rv = gettimeofday(&tv, NULL);
    526   1.1  pooka 	if (rv == -1) {
    527  1.10  pooka 		seterror(errno);
    528   1.1  pooka 		return rv;
    529   1.1  pooka 	}
    530   1.1  pooka 
    531   1.1  pooka 	*sec = tv.tv_sec;
    532   1.1  pooka 	*nsec = tv.tv_usec * 1000;
    533   1.1  pooka 
    534   1.1  pooka 	return 0;
    535   1.1  pooka }
    536   1.1  pooka 
    537   1.1  pooka int
    538   1.1  pooka rumpuser_getenv(const char *name, char *buf, size_t blen, int *error)
    539   1.1  pooka {
    540   1.1  pooka 
    541   1.1  pooka 	DOCALL(int, getenv_r(name, buf, blen));
    542   1.1  pooka }
    543   1.1  pooka 
/*
 * Build a host name for this rump instance in "name" ("namelen" bytes):
 * "rump-<pid>.<hostname>.rumpdomain", or "rump-<pid>.rumpdomain" when
 * the host name cannot be determined.  snprintf() truncates the result
 * to fit.  Always returns 0 and stores 0 in the error slot.
 */
int
rumpuser_gethostname(char *name, size_t namelen, int *error)
{
	char tmp[MAXHOSTNAMELEN];
	const int pid = (int)getpid();

	if (gethostname(tmp, sizeof(tmp)) == -1) {
		snprintf(name, namelen, "rump-%05d.rumpdomain", pid);
	} else {
		/*
		 * gethostname() is not required to terminate the buffer
		 * when the name had to be truncated; make sure the %s
		 * below cannot run off the end of tmp.
		 */
		tmp[sizeof(tmp) - 1] = '\0';
		snprintf(name, namelen, "rump-%05d.%s.rumpdomain",
		    pid, tmp);
	}

	seterror(0);
	return 0;
}
    559   1.1  pooka 
    560   1.1  pooka int
    561   1.1  pooka rumpuser_poll(struct pollfd *fds, int nfds, int timeout, int *error)
    562   1.1  pooka {
    563   1.1  pooka 
    564   1.1  pooka 	DOCALL_KLOCK(int, (poll(fds, (nfds_t)nfds, timeout)));
    565   1.1  pooka }
    566   1.1  pooka 
    567   1.1  pooka int
    568   1.1  pooka rumpuser_putchar(int c, int *error)
    569   1.1  pooka {
    570   1.1  pooka 
    571   1.1  pooka 	DOCALL(int, (putchar(c)));
    572   1.1  pooka }
    573   1.1  pooka 
    574   1.1  pooka void
    575   1.1  pooka rumpuser_exit(int rv)
    576   1.1  pooka {
    577   1.1  pooka 
    578   1.1  pooka 	if (rv == RUMPUSER_PANIC)
    579   1.1  pooka 		abort();
    580   1.1  pooka 	else
    581   1.1  pooka 		exit(rv);
    582   1.1  pooka }
    583   1.1  pooka 
/*
 * Set the host errno to "error".
 */
void
rumpuser_seterrno(int error)
{
	errno = error;
}
    590   1.1  pooka 
    591  1.21  pooka /*
    592  1.21  pooka  * On NetBSD we use kqueue, on Linux we use inotify.  The underlying
    593  1.21  pooka  * interface requirements aren't quite the same, but we have a very
    594  1.21  pooka  * good chance of doing the fd->path mapping on Linux thanks to dcache,
    595  1.21  pooka  * so just keep the existing interfaces for now.
    596  1.21  pooka  */
    597  1.21  pooka #if defined(__NetBSD__)
    598   1.1  pooka int
    599   1.1  pooka rumpuser_writewatchfile_setup(int kq, int fd, intptr_t opaque, int *error)
    600   1.1  pooka {
    601   1.1  pooka 	struct kevent kev;
    602   1.1  pooka 
    603   1.1  pooka 	if (kq == -1) {
    604   1.1  pooka 		kq = kqueue();
    605   1.1  pooka 		if (kq == -1) {
    606  1.10  pooka 			seterror(errno);
    607   1.1  pooka 			return -1;
    608   1.1  pooka 		}
    609   1.1  pooka 	}
    610   1.1  pooka 
    611   1.1  pooka 	EV_SET(&kev, fd, EVFILT_VNODE, EV_ADD|EV_ENABLE|EV_CLEAR,
    612   1.1  pooka 	    NOTE_WRITE, 0, opaque);
    613   1.1  pooka 	if (kevent(kq, &kev, 1, NULL, 0, NULL) == -1) {
    614  1.10  pooka 		seterror(errno);
    615   1.1  pooka 		return -1;
    616   1.1  pooka 	}
    617   1.1  pooka 
    618   1.1  pooka 	return kq;
    619   1.1  pooka }
    620   1.1  pooka 
    621   1.1  pooka int
    622   1.1  pooka rumpuser_writewatchfile_wait(int kq, intptr_t *opaque, int *error)
    623   1.1  pooka {
    624   1.1  pooka 	struct kevent kev;
    625   1.1  pooka 	int rv;
    626   1.1  pooka 
    627   1.9  pooka  again:
    628   1.1  pooka 	KLOCK_WRAP(rv = kevent(kq, NULL, 0, &kev, 1, NULL));
    629   1.1  pooka 	if (rv == -1) {
    630   1.9  pooka 		if (errno == EINTR)
    631   1.9  pooka 			goto again;
    632  1.10  pooka 		seterror(errno);
    633   1.1  pooka 		return -1;
    634   1.1  pooka 	}
    635   1.1  pooka 
    636   1.1  pooka 	if (opaque)
    637   1.1  pooka 		*opaque = kev.udata;
    638   1.1  pooka 	return rv;
    639   1.1  pooka }
    640  1.21  pooka 
    641  1.21  pooka #elif defined(__linux__)
    642  1.21  pooka #include <sys/inotify.h>
    643  1.21  pooka 
    644  1.21  pooka int
    645  1.21  pooka rumpuser_writewatchfile_setup(int inotify, int fd, intptr_t notused, int *error)
    646  1.21  pooka {
    647  1.21  pooka 	char procbuf[PATH_MAX], linkbuf[PATH_MAX];
    648  1.21  pooka 	ssize_t nn;
    649  1.21  pooka 
    650  1.21  pooka 	if (inotify == -1) {
    651  1.21  pooka 		inotify = inotify_init();
    652  1.21  pooka 		if (inotify == -1) {
    653  1.21  pooka 			seterror(errno);
    654  1.21  pooka 			return -1;
    655  1.21  pooka 		}
    656  1.21  pooka 	}
    657  1.21  pooka 
    658  1.21  pooka 	/* ok, need to map fd into path for inotify */
    659  1.21  pooka 	snprintf(procbuf, sizeof(procbuf), "/proc/self/fd/%d", fd);
    660  1.21  pooka 	nn = readlink(procbuf, linkbuf, sizeof(linkbuf));
    661  1.21  pooka 	if (nn >= (ssize_t)sizeof(linkbuf)) {
    662  1.21  pooka 		nn = -1;
    663  1.21  pooka 		errno = E2BIG; /* pick something */
    664  1.21  pooka 	}
    665  1.21  pooka 	if (nn == -1) {
    666  1.21  pooka 		seterror(errno);
    667  1.21  pooka 		close(inotify);
    668  1.21  pooka 		return -1;
    669  1.21  pooka 	}
    670  1.21  pooka 
    671  1.21  pooka 	if (inotify_add_watch(inotify, linkbuf, IN_MODIFY) == -1) {
    672  1.21  pooka 		seterror(errno);
    673  1.21  pooka 		close(inotify);
    674  1.21  pooka 		return -1;
    675  1.21  pooka 	}
    676  1.21  pooka 
    677  1.21  pooka 	return inotify;
    678  1.21  pooka }
    679  1.21  pooka 
    680  1.21  pooka int
    681  1.21  pooka rumpuser_writewatchfile_wait(int kq, intptr_t *opaque, int *error)
    682  1.21  pooka {
    683  1.21  pooka 	struct inotify_event iev;
    684  1.21  pooka 	ssize_t nn;
    685  1.21  pooka 
    686  1.21  pooka 	do {
    687  1.21  pooka 		KLOCK_WRAP(nn = read(kq, &iev, sizeof(iev)));
    688  1.21  pooka 	} while (errno == EINTR);
    689  1.21  pooka 
    690  1.21  pooka 	if (nn == -1) {
    691  1.21  pooka 		seterror(errno);
    692  1.21  pooka 		return -1;
    693  1.21  pooka 	}
    694  1.21  pooka 	return (nn/sizeof(iev));
    695  1.21  pooka }
    696  1.18  pooka #endif
    697   1.1  pooka 
/*
 * This is meant for safe debugging prints from the kernel.
 * Formats the arguments printf-style onto stderr and returns the
 * vfprintf() result.
 */
int
rumpuser_dprintf(const char *format, ...)
{
	va_list args;
	int nprinted;

	va_start(args, format);
	nprinted = vfprintf(stderr, format, args);
	va_end(args);

	return nprinted;
}
    713   1.2  pooka 
/*
 * Deliver signal "sig" to host process "pid"; RUMPUSER_PID_SELF means
 * the calling process, which is signalled with raise().  Only
 * implemented on NetBSD; elsewhere the call fails with EOPNOTSUPP.
 * On NetBSD, result and error reporting are handled by the DOCALL()
 * macro, which is defined outside this file.
 */
int
rumpuser_kill(int64_t pid, int sig, int *error)
{
#ifdef __NetBSD__
	if (pid != RUMPUSER_PID_SELF) {
		DOCALL(int, kill((pid_t)pid, sig));
	} else {
		DOCALL(int, raise(sig));
	}
#else
	/* XXXfixme: signal numbers may not match on non-NetBSD */
	seterror(EOPNOTSUPP);
	return -1;
#endif
}
    730   1.4  pooka 
/*
 * Return the number of CPUs on the host.  The result is always at
 * least 1: if the count cannot be determined, or the platform is not
 * handled here, 1 is returned.
 */
int
rumpuser_getnhostcpu(void)
{
	int ncpu = 1;

#if defined(__NetBSD__)
	size_t sz = sizeof(ncpu);

	/* do not trust the buffer contents if the query failed */
	if (sysctlbyname("hw.ncpu", &ncpu, &sz, NULL, 0) == -1 || ncpu < 1)
		ncpu = 1;
#elif defined(__linux__) || defined(__sun__)
	long nonline;

	/*
	 * Number of processors currently online.  sysconf() returns -1
	 * if it cannot tell, which must not leak out as a CPU count.
	 */
	nonline = sysconf(_SC_NPROCESSORS_ONLN);
	if (nonline >= 1)
		ncpu = (int)nonline;
#endif

	return ncpu;
}
    765  1.16    tls 
/*
 * XXX: this hypercall needs a better name
 *
 * Return a 32-bit value obtained from the host's arc4random().
 */
uint32_t
rumpuser_arc4random(void)
{
	const uint32_t value = arc4random();

	return value;
}
    773