Home | History | Annotate | Line # | Download | only in libukfs
ukfs.c revision 1.52
      1  1.52     pooka /*	$NetBSD: ukfs.c,v 1.52 2010/07/19 15:35:38 pooka Exp $	*/
      2   1.1     pooka 
      3   1.1     pooka /*
      4  1.38     pooka  * Copyright (c) 2007, 2008, 2009  Antti Kantee.  All Rights Reserved.
      5   1.1     pooka  *
      6   1.1     pooka  * Development of this software was supported by the
      7   1.1     pooka  * Finnish Cultural Foundation.
      8   1.1     pooka  *
      9   1.1     pooka  * Redistribution and use in source and binary forms, with or without
     10   1.1     pooka  * modification, are permitted provided that the following conditions
     11   1.1     pooka  * are met:
     12   1.1     pooka  * 1. Redistributions of source code must retain the above copyright
     13   1.1     pooka  *    notice, this list of conditions and the following disclaimer.
     14   1.1     pooka  * 2. Redistributions in binary form must reproduce the above copyright
     15   1.1     pooka  *    notice, this list of conditions and the following disclaimer in the
     16   1.1     pooka  *    documentation and/or other materials provided with the distribution.
     17   1.1     pooka  *
     18   1.1     pooka  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS
     19   1.1     pooka  * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
     20   1.1     pooka  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
     21   1.1     pooka  * DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
     22   1.1     pooka  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     23   1.1     pooka  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
     24   1.1     pooka  * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     25   1.1     pooka  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     26   1.1     pooka  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     27   1.1     pooka  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     28   1.1     pooka  * SUCH DAMAGE.
     29   1.1     pooka  */
     30   1.1     pooka 
/*
 * This library enables access to file systems directly without
 * involving system calls.
 */
     35   1.1     pooka 
     36   1.1     pooka #ifdef __linux__
     37   1.1     pooka #define _XOPEN_SOURCE 500
     38   1.1     pooka #define _BSD_SOURCE
     39   1.1     pooka #define _FILE_OFFSET_BITS 64
     40   1.1     pooka #endif
     41   1.1     pooka 
     42   1.3     pooka #include <sys/param.h>
     43   1.3     pooka #include <sys/queue.h>
     44   1.1     pooka #include <sys/stat.h>
     45   1.4     pooka #include <sys/sysctl.h>
     46   1.4     pooka #include <sys/mount.h>
     47   1.1     pooka 
     48   1.1     pooka #include <assert.h>
     49   1.3     pooka #include <dirent.h>
     50   1.3     pooka #include <dlfcn.h>
     51   1.1     pooka #include <err.h>
     52   1.1     pooka #include <errno.h>
     53  1.11     pooka #include <fcntl.h>
     54   1.1     pooka #include <pthread.h>
     55   1.1     pooka #include <stdio.h>
     56   1.1     pooka #include <stdlib.h>
     57   1.1     pooka #include <string.h>
     58   1.1     pooka #include <unistd.h>
     59   1.1     pooka #include <stdint.h>
     60   1.1     pooka 
     61   1.1     pooka #include <rump/ukfs.h>
     62   1.1     pooka 
     63   1.1     pooka #include <rump/rump.h>
     64   1.1     pooka #include <rump/rump_syscalls.h>
     65  1.43     pooka #include <rump/rumpuser.h>
     66   1.1     pooka 
     67  1.38     pooka #include "ukfs_int_disklabel.h"
     68  1.38     pooka 
     69   1.1     pooka #define UKFS_MODE_DEFAULT 0555
     70   1.1     pooka 
     71   1.1     pooka struct ukfs {
     72   1.1     pooka 	struct mount *ukfs_mp;
     73   1.1     pooka 	struct vnode *ukfs_rvp;
     74  1.37     pooka 	void *ukfs_specific;
     75   1.1     pooka 
     76   1.1     pooka 	pthread_spinlock_t ukfs_spin;
     77   1.1     pooka 	pid_t ukfs_nextpid;
     78   1.1     pooka 	struct vnode *ukfs_cdir;
     79  1.11     pooka 	int ukfs_devfd;
     80  1.30     pooka 	char *ukfs_devpath;
     81  1.30     pooka 	char *ukfs_mountpath;
     82  1.45     pooka 	struct ukfs_part *ukfs_part;
     83   1.1     pooka };
     84   1.1     pooka 
     85  1.30     pooka static int builddirs(const char *, mode_t,
     86  1.30     pooka     int (*mkdirfn)(struct ukfs *, const char *, mode_t), struct ukfs *);
     87  1.30     pooka 
     88   1.1     pooka struct mount *
     89   1.1     pooka ukfs_getmp(struct ukfs *ukfs)
     90   1.1     pooka {
     91   1.1     pooka 
     92   1.1     pooka 	return ukfs->ukfs_mp;
     93   1.1     pooka }
     94   1.1     pooka 
     95   1.1     pooka struct vnode *
     96   1.1     pooka ukfs_getrvp(struct ukfs *ukfs)
     97   1.1     pooka {
     98   1.1     pooka 	struct vnode *rvp;
     99   1.1     pooka 
    100   1.1     pooka 	rvp = ukfs->ukfs_rvp;
    101  1.40     pooka 	rump_pub_vp_incref(rvp);
    102   1.1     pooka 
    103   1.1     pooka 	return rvp;
    104   1.1     pooka }
    105   1.1     pooka 
    106  1.37     pooka void
    107  1.37     pooka ukfs_setspecific(struct ukfs *ukfs, void *priv)
    108  1.37     pooka {
    109  1.37     pooka 
    110  1.37     pooka 	ukfs->ukfs_specific = priv;
    111  1.37     pooka }
    112  1.37     pooka 
    113  1.37     pooka void *
    114  1.37     pooka ukfs_getspecific(struct ukfs *ukfs)
    115  1.37     pooka {
    116  1.37     pooka 
    117  1.37     pooka 	return ukfs->ukfs_specific;
    118  1.37     pooka }
    119  1.37     pooka 
/*
 * Builds that must not link against libpthread replace the spinlock
 * calls with no-ops.  The stubs expand to expressions rather than to
 * nothing so that call sites which inspect the result, such as
 * "if (pthread_spin_init(...) ...)", still compile; init reports
 * success (0) like the real function does.
 */
#ifdef DONT_WANT_PTHREAD_LINKAGE
#define pthread_spin_lock(a)	((void)0)
#define pthread_spin_unlock(a)	((void)0)
#define pthread_spin_init(a,b)	(0)
#define pthread_spin_destroy(a)	((void)0)
#endif
    126  1.20     pooka 
    127   1.1     pooka static pid_t
    128   1.1     pooka nextpid(struct ukfs *ukfs)
    129   1.1     pooka {
    130   1.1     pooka 	pid_t npid;
    131   1.1     pooka 
    132   1.1     pooka 	pthread_spin_lock(&ukfs->ukfs_spin);
    133   1.5     pooka 	if (ukfs->ukfs_nextpid == 0)
    134   1.5     pooka 		ukfs->ukfs_nextpid++;
    135   1.1     pooka 	npid = ukfs->ukfs_nextpid++;
    136   1.1     pooka 	pthread_spin_unlock(&ukfs->ukfs_spin);
    137   1.1     pooka 
    138   1.1     pooka 	return npid;
    139   1.1     pooka }
    140   1.1     pooka 
    141   1.1     pooka static void
    142   1.1     pooka precall(struct ukfs *ukfs)
    143   1.1     pooka {
    144   1.1     pooka 	struct vnode *rvp, *cvp;
    145   1.1     pooka 
    146  1.41     pooka 	rump_pub_lwp_alloc_and_switch(nextpid(ukfs), 1);
    147   1.1     pooka 	rvp = ukfs_getrvp(ukfs);
    148   1.1     pooka 	pthread_spin_lock(&ukfs->ukfs_spin);
    149   1.1     pooka 	cvp = ukfs->ukfs_cdir;
    150   1.1     pooka 	pthread_spin_unlock(&ukfs->ukfs_spin);
    151  1.40     pooka 	rump_pub_rcvp_set(rvp, cvp); /* takes refs */
    152  1.40     pooka 	rump_pub_vp_rele(rvp);
    153   1.1     pooka }
    154   1.1     pooka 
/*
 * Counterpart of precall(): call rump_pub_rcvp_set() with a NULL first
 * argument and the mount's root vnode as the second, drop the temporary
 * root reference and release the current lwp.
 */
static void
postcall(struct ukfs *ukfs)
{
	struct vnode *rootvp = ukfs_getrvp(ukfs);

	rump_pub_rcvp_set(NULL, rootvp);
	rump_pub_vp_rele(rootvp);
	rump_pub_lwp_release(rump_pub_lwp_curlwp());
}
    165   1.1     pooka 
    166  1.43     pooka struct ukfs_part {
    167  1.47     pooka 	pthread_spinlock_t part_lck;
    168  1.47     pooka 	int part_refcount;
    169  1.47     pooka 
    170  1.43     pooka 	int part_type;
    171  1.43     pooka 	char part_labelchar;
    172  1.43     pooka 	off_t part_devoff;
    173  1.43     pooka 	off_t part_devsize;
    174  1.43     pooka };
    175  1.43     pooka 
    176  1.43     pooka enum ukfs_parttype { UKFS_PART_NONE, UKFS_PART_DISKLABEL, UKFS_PART_OFFSET };
    177  1.43     pooka 
    178  1.43     pooka static struct ukfs_part ukfs__part_none = {
    179  1.43     pooka 	.part_type = UKFS_PART_NONE,
    180  1.43     pooka 	.part_devoff = 0,
    181  1.43     pooka 	.part_devsize = RUMP_ETFS_SIZE_ENDOFF,
    182  1.43     pooka };
    183  1.43     pooka static struct ukfs_part ukfs__part_na;
    184  1.44     pooka struct ukfs_part *ukfs_part_none = &ukfs__part_none;
    185  1.44     pooka struct ukfs_part *ukfs_part_na = &ukfs__part_na;
    186  1.43     pooka 
    187  1.45     pooka #define PART2LOCKSIZE(len) ((len) == RUMP_ETFS_SIZE_ENDOFF ? 0 : (len))
    188  1.45     pooka 
    189   1.1     pooka int
    190  1.10     pooka _ukfs_init(int version)
    191   1.1     pooka {
    192  1.10     pooka 	int rv;
    193  1.10     pooka 
    194  1.10     pooka 	if (version != UKFS_VERSION) {
    195  1.10     pooka 		printf("incompatible ukfs version, %d vs. %d\n",
    196  1.10     pooka 		    version, UKFS_VERSION);
    197  1.10     pooka 		errno = EPROGMISMATCH;
    198  1.10     pooka 		return -1;
    199  1.10     pooka 	}
    200   1.1     pooka 
    201  1.10     pooka 	if ((rv = rump_init()) != 0) {
    202  1.10     pooka 		errno = rv;
    203  1.10     pooka 		return -1;
    204  1.10     pooka 	}
    205   1.1     pooka 
    206   1.1     pooka 	return 0;
    207   1.1     pooka }
    208   1.1     pooka 
/*
 * mkdir callback for builddirs(): forwards to rump_sys_mkdir().  The
 * ukfs argument exists only to match the callback signature and is
 * ignored.
 */
/*ARGSUSED*/
static int
rumpmkdir(struct ukfs *dummy, const char *path, mode_t mode)
{
	int rv;

	rv = rump_sys_mkdir(path, mode);
	return rv;
}
    216  1.30     pooka 
    217  1.38     pooka int
    218  1.43     pooka ukfs_part_probe(char *devpath, struct ukfs_part **partp)
    219  1.38     pooka {
    220  1.43     pooka 	struct ukfs_part *part;
    221  1.38     pooka 	char *p;
    222  1.43     pooka 	int error = 0;
    223  1.43     pooka 	int devfd = -1;
    224  1.43     pooka 
    225  1.43     pooka 	if ((p = strstr(devpath, UKFS_PARTITION_SCANMAGIC)) != NULL) {
    226  1.43     pooka 		fprintf(stderr, "ukfs: %%PART is deprecated.  use "
    227  1.43     pooka 		    "%%DISKLABEL instead\n");
    228  1.43     pooka 		errno = ENODEV;
    229  1.43     pooka 		return -1;
    230  1.43     pooka 	}
    231  1.43     pooka 
    232  1.43     pooka 	part = malloc(sizeof(*part));
    233  1.43     pooka 	if (part == NULL) {
    234  1.43     pooka 		errno = ENOMEM;
    235  1.43     pooka 		return -1;
    236  1.43     pooka 	}
    237  1.47     pooka 	if (pthread_spin_init(&part->part_lck, PTHREAD_PROCESS_PRIVATE) == -1) {
    238  1.47     pooka 		error = errno;
    239  1.47     pooka 		free(part);
    240  1.47     pooka 		errno = error;
    241  1.47     pooka 		return -1;
    242  1.47     pooka 	}
    243  1.43     pooka 	part->part_type = UKFS_PART_NONE;
    244  1.47     pooka 	part->part_refcount = 1;
    245  1.38     pooka 
    246  1.38     pooka 	/*
    247  1.43     pooka 	 * Check for magic in pathname:
    248  1.43     pooka 	 *   disklabel: /regularpath%DISKLABEL:labelchar%\0
    249  1.43     pooka 	 *     offsets: /regularpath%OFFSET:start,end%\0
    250  1.38     pooka 	 */
    251  1.43     pooka #define MAGICADJ_DISKLABEL(p, n) (p+sizeof(UKFS_DISKLABEL_SCANMAGIC)-1+n)
    252  1.43     pooka 	if ((p = strstr(devpath, UKFS_DISKLABEL_SCANMAGIC)) != NULL
    253  1.43     pooka 	    && strlen(p) == UKFS_DISKLABEL_MAGICLEN
    254  1.43     pooka 	    && *(MAGICADJ_DISKLABEL(p,1)) == '%') {
    255  1.43     pooka 		if (*(MAGICADJ_DISKLABEL(p,0)) >= 'a' &&
    256  1.43     pooka 		    *(MAGICADJ_DISKLABEL(p,0)) < 'a' + UKFS_MAXPARTITIONS) {
    257  1.43     pooka 			struct ukfs__disklabel dl;
    258  1.43     pooka 			struct ukfs__partition *pp;
    259  1.43     pooka 			char buf[65536];
    260  1.43     pooka 			char labelchar = *(MAGICADJ_DISKLABEL(p,0));
    261  1.43     pooka 			int partition = labelchar - 'a';
    262  1.43     pooka 
    263  1.38     pooka 			*p = '\0';
    264  1.43     pooka 			devfd = open(devpath, O_RDONLY);
    265  1.43     pooka 			if (devfd == -1) {
    266  1.43     pooka 				error = errno;
    267  1.43     pooka 				goto out;
    268  1.43     pooka 			}
    269  1.43     pooka 
    270  1.43     pooka 			/* Locate the disklabel and find the partition. */
    271  1.43     pooka 			if (pread(devfd, buf, sizeof(buf), 0) == -1) {
    272  1.43     pooka 				error = errno;
    273  1.43     pooka 				goto out;
    274  1.43     pooka 			}
    275  1.43     pooka 
    276  1.43     pooka 			if (ukfs__disklabel_scan(&dl, buf, sizeof(buf)) != 0) {
    277  1.43     pooka 				error = ENOENT;
    278  1.43     pooka 				goto out;
    279  1.43     pooka 			}
    280  1.43     pooka 
    281  1.43     pooka 			if (dl.d_npartitions < partition) {
    282  1.43     pooka 				error = ENOENT;
    283  1.43     pooka 				goto out;
    284  1.43     pooka 			}
    285  1.43     pooka 
    286  1.43     pooka 			pp = &dl.d_partitions[partition];
    287  1.43     pooka 			part->part_type = UKFS_PART_DISKLABEL;
    288  1.43     pooka 			part->part_labelchar = labelchar;
    289  1.43     pooka 			part->part_devoff = pp->p_offset << DEV_BSHIFT;
    290  1.43     pooka 			part->part_devsize = pp->p_size << DEV_BSHIFT;
    291  1.38     pooka 		} else {
    292  1.43     pooka 			error = EINVAL;
    293  1.43     pooka 		}
    294  1.43     pooka #define MAGICADJ_OFFSET(p, n) (p+sizeof(UKFS_OFFSET_SCANMAGIC)-1+n)
    295  1.43     pooka 	} else if (((p = strstr(devpath, UKFS_OFFSET_SCANMAGIC)) != NULL)
    296  1.43     pooka 	    && (strlen(p) >= UKFS_OFFSET_MINLEN)) {
    297  1.43     pooka 		char *comma, *pers, *ep, *nptr;
    298  1.43     pooka 		u_quad_t val;
    299  1.43     pooka 
    300  1.43     pooka 		comma = strchr(p, ',');
    301  1.43     pooka 		if (comma == NULL) {
    302  1.43     pooka 			error = EINVAL;
    303  1.43     pooka 			goto out;
    304  1.43     pooka 		}
    305  1.43     pooka 		pers = strchr(comma, '%');
    306  1.43     pooka 		if (pers == NULL) {
    307  1.43     pooka 			error = EINVAL;
    308  1.43     pooka 			goto out;
    309  1.43     pooka 		}
    310  1.43     pooka 		*comma = '\0';
    311  1.43     pooka 		*pers = '\0';
    312  1.43     pooka 		*p = '\0';
    313  1.43     pooka 
    314  1.43     pooka 		nptr = MAGICADJ_OFFSET(p,0);
    315  1.43     pooka 		/* check if string is negative */
    316  1.43     pooka 		if (*nptr == '-') {
    317  1.43     pooka 			error = ERANGE;
    318  1.43     pooka 			goto out;
    319  1.43     pooka 		}
    320  1.43     pooka 		val = strtouq(nptr, &ep, 10);
    321  1.43     pooka 		if (val == UQUAD_MAX) {
    322  1.43     pooka 			error = ERANGE;
    323  1.43     pooka 			goto out;
    324  1.43     pooka 		}
    325  1.43     pooka 		if (*ep != '\0') {
    326  1.43     pooka 			error = EADDRNOTAVAIL; /* creative ;) */
    327  1.43     pooka 			goto out;
    328  1.43     pooka 		}
    329  1.43     pooka 		part->part_devoff = val;
    330  1.43     pooka 
    331  1.43     pooka 		/* omstart */
    332  1.43     pooka 
    333  1.43     pooka 		nptr = comma+1;
    334  1.43     pooka 		/* check if string is negative */
    335  1.43     pooka 		if (*nptr == '-') {
    336  1.43     pooka 			error = ERANGE;
    337  1.43     pooka 			goto out;
    338  1.43     pooka 		}
    339  1.43     pooka 		val = strtouq(nptr, &ep, 10);
    340  1.43     pooka 		if (val == UQUAD_MAX) {
    341  1.43     pooka 			error = ERANGE;
    342  1.43     pooka 			goto out;
    343  1.43     pooka 		}
    344  1.43     pooka 		if (*ep != '\0') {
    345  1.43     pooka 			error = EADDRNOTAVAIL; /* creative ;) */
    346  1.43     pooka 			goto out;
    347  1.38     pooka 		}
    348  1.43     pooka 		part->part_devsize = val;
    349  1.43     pooka 		part->part_type = UKFS_PART_OFFSET;
    350  1.38     pooka 	} else {
    351  1.47     pooka 		ukfs_part_release(part);
    352  1.43     pooka 		part = ukfs_part_none;
    353  1.43     pooka 	}
    354  1.43     pooka 
    355  1.43     pooka  out:
    356  1.43     pooka 	if (devfd != -1)
    357  1.43     pooka 		close(devfd);
    358  1.43     pooka 	if (error) {
    359  1.43     pooka 		free(part);
    360  1.43     pooka 		errno = error;
    361  1.43     pooka 	} else {
    362  1.43     pooka 		*partp = part;
    363  1.43     pooka 	}
    364  1.43     pooka 
    365  1.43     pooka 	return error ? -1 : 0;
    366  1.43     pooka }
    367  1.43     pooka 
    368  1.43     pooka int
    369  1.43     pooka ukfs_part_tostring(struct ukfs_part *part, char *str, size_t strsize)
    370  1.43     pooka {
    371  1.43     pooka 	int rv;
    372  1.43     pooka 
    373  1.43     pooka 	*str = '\0';
    374  1.43     pooka 	/* "pseudo" values */
    375  1.43     pooka 	if (part == ukfs_part_na) {
    376  1.43     pooka 		errno = EINVAL;
    377  1.43     pooka 		return -1;
    378  1.43     pooka 	}
    379  1.43     pooka 	if (part == ukfs_part_none)
    380  1.43     pooka 		return 0;
    381  1.43     pooka 
    382  1.43     pooka 	rv = 0;
    383  1.43     pooka 	switch (part->part_type) {
    384  1.43     pooka 	case UKFS_PART_NONE:
    385  1.43     pooka 		break;
    386  1.43     pooka 
    387  1.43     pooka 	case UKFS_PART_DISKLABEL:
    388  1.43     pooka 		snprintf(str, strsize, "%%DISKLABEL:%c%%",part->part_labelchar);
    389  1.43     pooka 		rv = 1;
    390  1.43     pooka 		break;
    391  1.43     pooka 
    392  1.43     pooka 	case UKFS_PART_OFFSET:
    393  1.43     pooka 		snprintf(str, strsize, "[%llu,%llu]",
    394  1.43     pooka 		    (unsigned long long)part->part_devoff,
    395  1.43     pooka 		    (unsigned long long)(part->part_devoff+part->part_devsize));
    396  1.43     pooka 		rv = 1;
    397  1.43     pooka 		break;
    398  1.38     pooka 	}
    399  1.38     pooka 
    400  1.38     pooka 	return rv;
    401  1.38     pooka }
    402  1.38     pooka 
    403  1.45     pooka static void
    404  1.45     pooka unlockdev(int fd, struct ukfs_part *part)
    405  1.45     pooka {
    406  1.45     pooka 	struct flock flarg;
    407  1.45     pooka 
    408  1.47     pooka 	if (part == ukfs_part_na)
    409  1.47     pooka 		return;
    410  1.47     pooka 
    411  1.45     pooka 	memset(&flarg, 0, sizeof(flarg));
    412  1.45     pooka 	flarg.l_type = F_UNLCK;
    413  1.45     pooka 	flarg.l_whence = SEEK_SET;
    414  1.45     pooka 	flarg.l_start = part->part_devoff;
    415  1.45     pooka 	flarg.l_len = PART2LOCKSIZE(part->part_devsize);
    416  1.45     pooka 	if (fcntl(fd, F_SETLK, &flarg) == -1)
    417  1.45     pooka 		warn("ukfs: cannot unlock device file");
    418  1.45     pooka }
    419  1.45     pooka 
    420  1.38     pooka /*
    421  1.38     pooka  * Open the disk file and flock it.  Also, if we are operation on
    422  1.38     pooka  * an embedded partition, find the partition offset and size from
    423  1.38     pooka  * the disklabel.
    424  1.38     pooka  *
    425  1.38     pooka  * We hard-fail only in two cases:
    426  1.38     pooka  *  1) we failed to get the partition info out (don't know what offset
    427  1.38     pooka  *     to mount from)
    428  1.45     pooka  *  2) we failed to flock the source device (i.e. fcntl() fails,
    429  1.38     pooka  *     not e.g. open() before it)
    430  1.38     pooka  *
    431  1.38     pooka  * Otherwise we let the code proceed to mount and let the file system
    432  1.38     pooka  * throw the proper error.  The only questionable bit is that if we
    433  1.45     pooka  * soft-fail before flock and mount does succeed...
    434  1.38     pooka  *
    435  1.38     pooka  * Returns: -1 error (errno reports error code)
    436  1.38     pooka  *           0 success
    437  1.38     pooka  *
    438  1.38     pooka  * dfdp: -1  device is not open
    439  1.38     pooka  *        n  device is open
    440  1.38     pooka  */
    441  1.38     pooka static int
    442  1.43     pooka process_diskdevice(const char *devpath, struct ukfs_part *part, int rdonly,
    443  1.43     pooka 	int *dfdp)
    444   1.1     pooka {
    445  1.22     pooka 	struct stat sb;
    446  1.38     pooka 	int rv = 0, devfd;
    447  1.38     pooka 
    448  1.38     pooka 	/* defaults */
    449  1.38     pooka 	*dfdp = -1;
    450  1.38     pooka 
    451  1.38     pooka 	devfd = open(devpath, rdonly ? O_RDONLY : O_RDWR);
    452  1.38     pooka 	if (devfd == -1) {
    453  1.43     pooka 		rv = errno;
    454  1.38     pooka 		goto out;
    455  1.38     pooka 	}
    456  1.38     pooka 
    457  1.38     pooka 	if (fstat(devfd, &sb) == -1) {
    458  1.38     pooka 		rv = errno;
    459  1.38     pooka 		goto out;
    460  1.38     pooka 	}
    461   1.1     pooka 
    462  1.11     pooka 	/*
    463  1.38     pooka 	 * We do this only for non-block device since the
    464  1.38     pooka 	 * (NetBSD) kernel allows block device open only once.
    465  1.38     pooka 	 * We also need to close the device for fairly obvious reasons.
    466  1.11     pooka 	 */
    467  1.38     pooka 	if (!S_ISBLK(sb.st_mode)) {
    468  1.45     pooka 		struct flock flarg;
    469  1.45     pooka 
    470  1.45     pooka 		memset(&flarg, 0, sizeof(flarg));
    471  1.45     pooka 		flarg.l_type = rdonly ? F_RDLCK : F_WRLCK;
    472  1.45     pooka 		flarg.l_whence = SEEK_SET;
    473  1.45     pooka 		flarg.l_start = part->part_devoff;
    474  1.45     pooka 		flarg.l_len = PART2LOCKSIZE(part->part_devsize);
    475  1.45     pooka 		if (fcntl(devfd, F_SETLK, &flarg) == -1) {
    476  1.45     pooka 			pid_t holder;
    477  1.45     pooka 			int sverrno;
    478  1.45     pooka 
    479  1.45     pooka 			sverrno = errno;
    480  1.45     pooka 			if (fcntl(devfd, F_GETLK, &flarg) != 1)
    481  1.45     pooka 				holder = flarg.l_pid;
    482  1.45     pooka 			else
    483  1.45     pooka 				holder = -1;
    484  1.45     pooka 			warnx("ukfs_mount: cannot lock device.  held by pid %d",
    485  1.45     pooka 			    holder);
    486  1.45     pooka 			rv = sverrno;
    487  1.11     pooka 			goto out;
    488  1.11     pooka 		}
    489  1.38     pooka 	} else {
    490  1.38     pooka 		close(devfd);
    491  1.38     pooka 		devfd = -1;
    492  1.38     pooka 	}
    493  1.38     pooka 	*dfdp = devfd;
    494  1.22     pooka 
    495  1.38     pooka  out:
    496  1.38     pooka 	if (rv) {
    497  1.38     pooka 		if (devfd != -1)
    498  1.22     pooka 			close(devfd);
    499  1.11     pooka 	}
    500   1.1     pooka 
    501  1.38     pooka 	return rv;
    502  1.38     pooka }
    503  1.38     pooka 
/*
 * Argument bundle for mfs_mounter(): the parameters of one
 * rump_sys_mount() call, passed through pthread_create()'s void pointer.
 */
struct mountinfo {
	const char *mi_vfsname;		/* file system type name */
	const char *mi_mountpath;	/* where to mount */
	int mi_mntflags;		/* mount flags */
	void *mi_arg;			/* file system specific argument */
	size_t mi_alen;			/* size of *mi_arg */
	int *mi_error;			/* not read by mfs_mounter() */
};
    512  1.49     pooka static void *
    513  1.49     pooka mfs_mounter(void *arg)
    514  1.49     pooka {
    515  1.49     pooka 	struct mountinfo *mi = arg;
    516  1.49     pooka 	int rv;
    517  1.49     pooka 
    518  1.49     pooka 	rv = rump_sys_mount(mi->mi_vfsname, mi->mi_mountpath, mi->mi_mntflags,
    519  1.49     pooka 	    mi->mi_arg, mi->mi_alen);
    520  1.49     pooka 	if (rv) {
    521  1.49     pooka 		warn("mfs mount failed.  fix me.");
    522  1.49     pooka 		abort(); /* XXX */
    523  1.49     pooka 	}
    524  1.49     pooka 
    525  1.49     pooka 	return NULL;
    526  1.49     pooka }
    527  1.49     pooka 
    528  1.38     pooka static struct ukfs *
    529  1.43     pooka doukfsmount(const char *vfsname, const char *devpath, struct ukfs_part *part,
    530  1.38     pooka 	const char *mountpath, int mntflags, void *arg, size_t alen)
    531  1.38     pooka {
    532  1.38     pooka 	struct ukfs *fs = NULL;
    533  1.39     pooka 	int rv = 0, devfd = -1;
    534  1.38     pooka 	int mounted = 0;
    535  1.38     pooka 	int regged = 0;
    536  1.38     pooka 
    537  1.47     pooka 	pthread_spin_lock(&part->part_lck);
    538  1.47     pooka 	part->part_refcount++;
    539  1.47     pooka 	pthread_spin_unlock(&part->part_lck);
    540  1.43     pooka 	if (part != ukfs_part_na) {
    541  1.43     pooka 		if ((rv = process_diskdevice(devpath, part,
    542  1.43     pooka 		    mntflags & MNT_RDONLY, &devfd)) != 0)
    543  1.43     pooka 			goto out;
    544  1.43     pooka 	}
    545  1.38     pooka 
    546   1.1     pooka 	fs = malloc(sizeof(struct ukfs));
    547   1.1     pooka 	if (fs == NULL) {
    548   1.1     pooka 		rv = ENOMEM;
    549   1.1     pooka 		goto out;
    550   1.1     pooka 	}
    551   1.1     pooka 	memset(fs, 0, sizeof(struct ukfs));
    552  1.30     pooka 
    553  1.30     pooka 	/* create our mountpoint.  this is never removed. */
    554  1.30     pooka 	if (builddirs(mountpath, 0777, rumpmkdir, NULL) == -1) {
    555  1.30     pooka 		if (errno != EEXIST) {
    556  1.30     pooka 			rv = errno;
    557  1.30     pooka 			goto out;
    558  1.30     pooka 		}
    559  1.30     pooka 	}
    560   1.1     pooka 
    561  1.43     pooka 	if (part != ukfs_part_na) {
    562  1.43     pooka 		/* LINTED */
    563  1.40     pooka 		rv = rump_pub_etfs_register_withsize(devpath, devpath,
    564  1.43     pooka 		    RUMP_ETFS_BLK, part->part_devoff, part->part_devsize);
    565  1.33     pooka 		if (rv) {
    566  1.33     pooka 			goto out;
    567  1.33     pooka 		}
    568  1.33     pooka 		regged = 1;
    569  1.33     pooka 	}
    570  1.38     pooka 
    571  1.49     pooka 	/*
    572  1.49     pooka 	 * MFS is special since mount(2) doesn't return.  Hence, we
    573  1.49     pooka 	 * create a thread here.  Could fix mfs to return, but there's
    574  1.49     pooka 	 * too much history for me to bother.
    575  1.49     pooka 	 */
    576  1.49     pooka 	if (strcmp(vfsname, MOUNT_MFS) == 0) {
    577  1.49     pooka 		pthread_t pt;
    578  1.49     pooka 		struct mountinfo mi;
    579  1.49     pooka 		int i;
    580  1.49     pooka 
    581  1.49     pooka 		mi.mi_vfsname = vfsname;
    582  1.49     pooka 		mi.mi_mountpath = mountpath;
    583  1.49     pooka 		mi.mi_mntflags = mntflags;
    584  1.49     pooka 		mi.mi_arg = arg;
    585  1.49     pooka 		mi.mi_alen = alen;
    586  1.49     pooka 
    587  1.49     pooka 		if (pthread_create(&pt, NULL, mfs_mounter, &mi) == -1) {
    588  1.49     pooka 			rv = errno;
    589  1.49     pooka 			goto out;
    590  1.49     pooka 		}
    591  1.49     pooka 
    592  1.49     pooka 		for (i = 0;i < 100000; i++) {
    593  1.49     pooka 			struct statvfs svfsb;
    594  1.49     pooka 
    595  1.49     pooka 			rv = rump_sys_statvfs1(mountpath, &svfsb, ST_WAIT);
    596  1.49     pooka 			if (rv == -1) {
    597  1.49     pooka 				rv = errno;
    598  1.49     pooka 				goto out;
    599  1.49     pooka 			}
    600  1.49     pooka 
    601  1.49     pooka 			if (strcmp(svfsb.f_mntonname, mountpath) == 0 &&
    602  1.49     pooka 			    strcmp(svfsb.f_fstypename, MOUNT_MFS) == 0) {
    603  1.49     pooka 				break;
    604  1.49     pooka 			}
    605  1.49     pooka 			usleep(1);
    606  1.49     pooka 		}
    607  1.49     pooka 	} else {
    608  1.49     pooka 		rv = rump_sys_mount(vfsname, mountpath, mntflags, arg, alen);
    609  1.49     pooka 		if (rv) {
    610  1.49     pooka 			rv = errno;
    611  1.49     pooka 			goto out;
    612  1.49     pooka 		}
    613   1.1     pooka 	}
    614  1.49     pooka 
    615  1.30     pooka 	mounted = 1;
    616  1.40     pooka 	rv = rump_pub_vfs_getmp(mountpath, &fs->ukfs_mp);
    617  1.11     pooka 	if (rv) {
    618  1.11     pooka 		goto out;
    619  1.11     pooka 	}
    620  1.40     pooka 	rv = rump_pub_vfs_root(fs->ukfs_mp, &fs->ukfs_rvp, 0);
    621  1.30     pooka 	if (rv) {
    622  1.30     pooka 		goto out;
    623  1.30     pooka 	}
    624  1.30     pooka 
    625  1.33     pooka 	if (regged) {
    626  1.33     pooka 		fs->ukfs_devpath = strdup(devpath);
    627  1.33     pooka 	}
    628  1.30     pooka 	fs->ukfs_mountpath = strdup(mountpath);
    629  1.11     pooka 	fs->ukfs_cdir = ukfs_getrvp(fs);
    630  1.11     pooka 	pthread_spin_init(&fs->ukfs_spin, PTHREAD_PROCESS_SHARED);
    631  1.11     pooka 	fs->ukfs_devfd = devfd;
    632  1.45     pooka 	fs->ukfs_part = part;
    633  1.11     pooka 	assert(rv == 0);
    634   1.1     pooka 
    635   1.1     pooka  out:
    636   1.1     pooka 	if (rv) {
    637  1.30     pooka 		if (fs) {
    638  1.30     pooka 			if (fs->ukfs_rvp)
    639  1.40     pooka 				rump_pub_vp_rele(fs->ukfs_rvp);
    640   1.1     pooka 			free(fs);
    641  1.30     pooka 			fs = NULL;
    642  1.30     pooka 		}
    643  1.30     pooka 		if (mounted)
    644  1.30     pooka 			rump_sys_unmount(mountpath, MNT_FORCE);
    645  1.33     pooka 		if (regged)
    646  1.40     pooka 			rump_pub_etfs_remove(devpath);
    647  1.11     pooka 		if (devfd != -1) {
    648  1.46     pooka 			unlockdev(devfd, part);
    649  1.11     pooka 			close(devfd);
    650  1.11     pooka 		}
    651  1.45     pooka 		ukfs_part_release(part);
    652  1.34     pooka 		errno = rv;
    653   1.1     pooka 	}
    654   1.1     pooka 
    655   1.1     pooka 	return fs;
    656   1.1     pooka }
    657   1.1     pooka 
    658  1.38     pooka struct ukfs *
    659  1.38     pooka ukfs_mount(const char *vfsname, const char *devpath,
    660  1.38     pooka 	const char *mountpath, int mntflags, void *arg, size_t alen)
    661  1.38     pooka {
    662  1.38     pooka 
    663  1.43     pooka 	return doukfsmount(vfsname, devpath, ukfs_part_na,
    664  1.38     pooka 	    mountpath, mntflags, arg, alen);
    665  1.38     pooka }
    666  1.38     pooka 
/*
 * Mount a file system from the given partition of a host device or
 * image.  All arguments are passed straight to doukfsmount().  Returns
 * the new handle or NULL with errno set.
 */
struct ukfs *
ukfs_mount_disk(const char *vfsname, const char *devpath,
	struct ukfs_part *part, const char *mountpath, int mntflags,
	void *arg, size_t alen)
{
	struct ukfs *fs;

	fs = doukfsmount(vfsname, devpath, part,
	    mountpath, mntflags, arg, alen);
	return fs;
}
    676  1.38     pooka 
    677  1.30     pooka int
    678   1.1     pooka ukfs_release(struct ukfs *fs, int flags)
    679   1.1     pooka {
    680   1.1     pooka 
    681   1.1     pooka 	if ((flags & UKFS_RELFLAG_NOUNMOUNT) == 0) {
    682  1.37     pooka 		int rv, mntflag, error;
    683   1.9     pooka 
    684  1.30     pooka 		ukfs_chdir(fs, "/");
    685  1.30     pooka 		mntflag = 0;
    686  1.30     pooka 		if (flags & UKFS_RELFLAG_FORCE)
    687  1.30     pooka 			mntflag = MNT_FORCE;
    688  1.41     pooka 		rump_pub_lwp_alloc_and_switch(nextpid(fs), 1);
    689  1.40     pooka 		rump_pub_vp_rele(fs->ukfs_rvp);
    690  1.37     pooka 		fs->ukfs_rvp = NULL;
    691  1.30     pooka 		rv = rump_sys_unmount(fs->ukfs_mountpath, mntflag);
    692  1.37     pooka 		if (rv == -1) {
    693  1.37     pooka 			error = errno;
    694  1.40     pooka 			rump_pub_vfs_root(fs->ukfs_mp, &fs->ukfs_rvp, 0);
    695  1.41     pooka 			rump_pub_lwp_release(rump_pub_lwp_curlwp());
    696  1.30     pooka 			ukfs_chdir(fs, fs->ukfs_mountpath);
    697  1.37     pooka 			errno = error;
    698  1.30     pooka 			return -1;
    699  1.30     pooka 		}
    700  1.41     pooka 		rump_pub_lwp_release(rump_pub_lwp_curlwp());
    701   1.1     pooka 	}
    702   1.1     pooka 
    703  1.33     pooka 	if (fs->ukfs_devpath) {
    704  1.40     pooka 		rump_pub_etfs_remove(fs->ukfs_devpath);
    705  1.33     pooka 		free(fs->ukfs_devpath);
    706  1.33     pooka 	}
    707  1.30     pooka 	free(fs->ukfs_mountpath);
    708   1.1     pooka 
    709   1.1     pooka 	pthread_spin_destroy(&fs->ukfs_spin);
    710  1.16  stacktic 	if (fs->ukfs_devfd != -1) {
    711  1.45     pooka 		unlockdev(fs->ukfs_devfd, fs->ukfs_part);
    712  1.16  stacktic 		close(fs->ukfs_devfd);
    713  1.16  stacktic 	}
    714  1.47     pooka 	ukfs_part_release(fs->ukfs_part);
    715   1.1     pooka 	free(fs);
    716  1.30     pooka 
    717  1.30     pooka 	return 0;
    718   1.1     pooka }
    719   1.1     pooka 
    720  1.43     pooka void
    721  1.43     pooka ukfs_part_release(struct ukfs_part *part)
    722  1.43     pooka {
    723  1.47     pooka 	int release;
    724  1.43     pooka 
    725  1.47     pooka 	if (part != ukfs_part_none && part != ukfs_part_na) {
    726  1.47     pooka 		pthread_spin_lock(&part->part_lck);
    727  1.47     pooka 		release = --part->part_refcount == 0;
    728  1.47     pooka 		pthread_spin_unlock(&part->part_lck);
    729  1.47     pooka 		if (release) {
    730  1.47     pooka 			pthread_spin_destroy(&part->part_lck);
    731  1.47     pooka 			free(part);
    732  1.47     pooka 		}
    733  1.47     pooka 	}
    734  1.43     pooka }
    735  1.43     pooka 
/*
 * Complete body of a simple int-returning wrapper: evaluate "thecall"
 * between precall(ukfs) and postcall(ukfs) and return its value.
 * Expands to a declaration followed by statements ending in a return,
 * so it has to be the only thing in the function using it.
 */
#define STDCALL(ukfs, thecall)						\
	int rv;								\
									\
	precall(ukfs);							\
	rv = (thecall);							\
	postcall(ukfs);							\
	return rv;
    743   1.1     pooka 
    744   1.1     pooka int
    745  1.24     pooka ukfs_opendir(struct ukfs *ukfs, const char *dirname, struct ukfs_dircookie **c)
    746   1.1     pooka {
    747   1.1     pooka 	struct vnode *vp;
    748  1.24     pooka 	int rv;
    749   1.1     pooka 
    750   1.1     pooka 	precall(ukfs);
    751  1.40     pooka 	rv = rump_pub_namei(RUMP_NAMEI_LOOKUP, RUMP_NAMEI_LOCKLEAF, dirname,
    752   1.1     pooka 	    NULL, &vp, NULL);
    753   1.1     pooka 	postcall(ukfs);
    754  1.24     pooka 
    755  1.24     pooka 	if (rv == 0) {
    756  1.51   hannken 		RUMP_VOP_UNLOCK(vp);
    757  1.24     pooka 	} else {
    758  1.24     pooka 		errno = rv;
    759  1.24     pooka 		rv = -1;
    760  1.24     pooka 	}
    761  1.24     pooka 
    762  1.24     pooka 	/*LINTED*/
    763  1.24     pooka 	*c = (struct ukfs_dircookie *)vp;
    764  1.24     pooka 	return rv;
    765  1.24     pooka }
    766  1.24     pooka 
    767  1.24     pooka static int
    768  1.24     pooka getmydents(struct vnode *vp, off_t *off, uint8_t *buf, size_t bufsize)
    769  1.24     pooka {
    770  1.24     pooka 	struct uio *uio;
    771  1.24     pooka 	size_t resid;
    772  1.24     pooka 	int rv, eofflag;
    773  1.50     pooka 	struct kauth_cred *cred;
    774  1.24     pooka 
    775  1.40     pooka 	uio = rump_pub_uio_setup(buf, bufsize, *off, RUMPUIO_READ);
    776  1.40     pooka 	cred = rump_pub_cred_suserget();
    777   1.9     pooka 	rv = RUMP_VOP_READDIR(vp, uio, cred, &eofflag, NULL, NULL);
    778  1.40     pooka 	rump_pub_cred_put(cred);
    779  1.51   hannken 	RUMP_VOP_UNLOCK(vp);
    780  1.40     pooka 	*off = rump_pub_uio_getoff(uio);
    781  1.40     pooka 	resid = rump_pub_uio_free(uio);
    782   1.1     pooka 
    783   1.1     pooka 	if (rv) {
    784   1.1     pooka 		errno = rv;
    785   1.1     pooka 		return -1;
    786   1.1     pooka 	}
    787   1.1     pooka 
    788   1.1     pooka 	/* LINTED: not totally correct return type, but follows syscall */
    789   1.1     pooka 	return bufsize - resid;
    790   1.1     pooka }
    791   1.1     pooka 
    792  1.24     pooka /*ARGSUSED*/
    793  1.24     pooka int
    794  1.24     pooka ukfs_getdents_cookie(struct ukfs *ukfs, struct ukfs_dircookie *c, off_t *off,
    795  1.24     pooka 	uint8_t *buf, size_t bufsize)
    796  1.24     pooka {
    797  1.24     pooka 	/*LINTED*/
    798  1.24     pooka 	struct vnode *vp = (struct vnode *)c;
    799  1.24     pooka 
    800  1.24     pooka 	RUMP_VOP_LOCK(vp, RUMP_LK_SHARED);
    801  1.24     pooka 	return getmydents(vp, off, buf, bufsize);
    802  1.24     pooka }
    803  1.24     pooka 
    804  1.24     pooka int
    805  1.24     pooka ukfs_getdents(struct ukfs *ukfs, const char *dirname, off_t *off,
    806  1.24     pooka 	uint8_t *buf, size_t bufsize)
    807  1.24     pooka {
    808  1.24     pooka 	struct vnode *vp;
    809  1.24     pooka 	int rv;
    810  1.24     pooka 
    811  1.24     pooka 	precall(ukfs);
    812  1.40     pooka 	rv = rump_pub_namei(RUMP_NAMEI_LOOKUP, RUMP_NAMEI_LOCKLEAF, dirname,
    813  1.24     pooka 	    NULL, &vp, NULL);
    814  1.24     pooka 	postcall(ukfs);
    815  1.24     pooka 	if (rv) {
    816  1.24     pooka 		errno = rv;
    817  1.24     pooka 		return -1;
    818  1.24     pooka 	}
    819  1.24     pooka 
    820  1.24     pooka 	rv = getmydents(vp, off, buf, bufsize);
    821  1.40     pooka 	rump_pub_vp_rele(vp);
    822  1.24     pooka 	return rv;
    823  1.24     pooka }
    824  1.24     pooka 
/*
 * Release the vnode reference held by a directory cookie.  The ukfs
 * argument is unused.  Always returns 0.
 */
/*ARGSUSED*/
int
ukfs_closedir(struct ukfs *ukfs, struct ukfs_dircookie *c)
{
	struct vnode *dvp;

	/*LINTED*/
	dvp = (struct vnode *)c;
	rump_pub_vp_rele(dvp);
	return 0;
}
    834  1.24     pooka 
/*
 * Open "filename" with the given flags (mode 0) via rump_sys_open()
 * between precall() and postcall().  Returns the descriptor, or -1 if
 * the open failed.
 */
int
ukfs_open(struct ukfs *ukfs, const char *filename, int flags)
{
	int newfd;

	precall(ukfs);
	newfd = rump_sys_open(filename, flags, 0);
	postcall(ukfs);

	/* -1 on failure is passed through unchanged */
	return newfd;
}
    848  1.24     pooka 
    849   1.1     pooka ssize_t
    850   1.1     pooka ukfs_read(struct ukfs *ukfs, const char *filename, off_t off,
    851   1.1     pooka 	uint8_t *buf, size_t bufsize)
    852   1.1     pooka {
    853  1.21     pooka 	int fd;
    854   1.1     pooka 	ssize_t xfer = -1; /* XXXgcc */
    855   1.1     pooka 
    856   1.1     pooka 	precall(ukfs);
    857  1.21     pooka 	fd = rump_sys_open(filename, RUMP_O_RDONLY, 0);
    858  1.21     pooka 	if (fd == -1)
    859   1.1     pooka 		goto out;
    860   1.1     pooka 
    861  1.27     pooka 	xfer = rump_sys_pread(fd, buf, bufsize, off);
    862  1.21     pooka 	rump_sys_close(fd);
    863   1.1     pooka 
    864   1.1     pooka  out:
    865   1.1     pooka 	postcall(ukfs);
    866  1.21     pooka 	if (fd == -1) {
    867   1.1     pooka 		return -1;
    868   1.1     pooka 	}
    869   1.1     pooka 	return xfer;
    870   1.1     pooka }
    871   1.1     pooka 
/*
 * Read up to buflen bytes at offset off from an already open descriptor.
 * The ukfs argument is unused.  Returns the rump_sys_pread() result.
 */
/*ARGSUSED*/
ssize_t
ukfs_read_fd(struct ukfs *ukfs, int fd, off_t off, uint8_t *buf, size_t buflen)
{
	ssize_t nread;

	nread = rump_sys_pread(fd, buf, buflen, off);
	return nread;
}
    879  1.24     pooka 
    880   1.1     pooka ssize_t
    881   1.1     pooka ukfs_write(struct ukfs *ukfs, const char *filename, off_t off,
    882   1.1     pooka 	uint8_t *buf, size_t bufsize)
    883   1.1     pooka {
    884  1.21     pooka 	int fd;
    885   1.1     pooka 	ssize_t xfer = -1; /* XXXgcc */
    886   1.1     pooka 
    887   1.1     pooka 	precall(ukfs);
    888  1.21     pooka 	fd = rump_sys_open(filename, RUMP_O_WRONLY, 0);
    889  1.21     pooka 	if (fd == -1)
    890   1.1     pooka 		goto out;
    891   1.1     pooka 
    892   1.1     pooka 	/* write and commit */
    893  1.27     pooka 	xfer = rump_sys_pwrite(fd, buf, bufsize, off);
    894  1.21     pooka 	if (xfer > 0)
    895  1.21     pooka 		rump_sys_fsync(fd);
    896   1.1     pooka 
    897  1.21     pooka 	rump_sys_close(fd);
    898   1.1     pooka 
    899   1.1     pooka  out:
    900   1.1     pooka 	postcall(ukfs);
    901  1.21     pooka 	if (fd == -1) {
    902   1.1     pooka 		return -1;
    903   1.1     pooka 	}
    904   1.1     pooka 	return xfer;
    905   1.1     pooka }
    906   1.1     pooka 
/*
 * Write buflen bytes from buf at offset off to an already open
 * descriptor.  If dosync is nonzero and something was written, the
 * descriptor is synced with rump_sys_fsync().  The ukfs argument is
 * unused.  Returns the rump_sys_pwrite() result.
 */
/*ARGSUSED*/
ssize_t
ukfs_write_fd(struct ukfs *ukfs, int fd, off_t off, uint8_t *buf, size_t buflen,
	int dosync)
{
	ssize_t nwritten = rump_sys_pwrite(fd, buf, buflen, off);

	if (dosync && nwritten > 0)
		rump_sys_fsync(fd);

	return nwritten;
}
    920  1.24     pooka 
/*
 * Close a descriptor obtained from ukfs_open().  The ukfs argument is
 * unused and the result of rump_sys_close() is not reported: this
 * function always returns 0.
 */
/*ARGSUSED*/
int
ukfs_close(struct ukfs *ukfs, int fd)
{

	(void)rump_sys_close(fd);

	return 0;
}
    929  1.24     pooka 
    930   1.1     pooka int
    931   1.1     pooka ukfs_create(struct ukfs *ukfs, const char *filename, mode_t mode)
    932   1.1     pooka {
    933  1.21     pooka 	int fd;
    934   1.1     pooka 
    935   1.1     pooka 	precall(ukfs);
    936  1.21     pooka 	fd = rump_sys_open(filename, RUMP_O_WRONLY | RUMP_O_CREAT, mode);
    937  1.21     pooka 	if (fd == -1)
    938  1.21     pooka 		return -1;
    939  1.21     pooka 	rump_sys_close(fd);
    940   1.1     pooka 
    941   1.1     pooka 	postcall(ukfs);
    942   1.1     pooka 	return 0;
    943   1.1     pooka }
    944   1.1     pooka 
/*
 * Run rump_sys_mknod(path, mode, dev) between precall() and postcall()
 * and return its result.
 */
int
ukfs_mknod(struct ukfs *ukfs, const char *path, mode_t mode, dev_t dev)
{
	int error;

	precall(ukfs);
	error = rump_sys_mknod(path, mode, dev);
	postcall(ukfs);
	return error;
}
    951   1.1     pooka 
/*
 * Run rump_sys_mkfifo(path, mode) between precall() and postcall() and
 * return its result.
 */
int
ukfs_mkfifo(struct ukfs *ukfs, const char *path, mode_t mode)
{
	int error;

	precall(ukfs);
	error = rump_sys_mkfifo(path, mode);
	postcall(ukfs);
	return error;
}
    958   1.1     pooka 
/*
 * Run rump_sys_mkdir(filename, mode) between precall() and postcall()
 * and return its result.
 */
int
ukfs_mkdir(struct ukfs *ukfs, const char *filename, mode_t mode)
{
	int error;

	precall(ukfs);
	error = rump_sys_mkdir(filename, mode);
	postcall(ukfs);
	return error;
}
    965   1.1     pooka 
/*
 * Run rump_sys_unlink(filename) between precall() and postcall() and
 * return its result.
 */
int
ukfs_remove(struct ukfs *ukfs, const char *filename)
{
	int error;

	precall(ukfs);
	error = rump_sys_unlink(filename);
	postcall(ukfs);
	return error;
}
    972   1.1     pooka 
/*
 * Run rump_sys_rmdir(filename) between precall() and postcall() and
 * return its result.
 */
int
ukfs_rmdir(struct ukfs *ukfs, const char *filename)
{
	int error;

	precall(ukfs);
	error = rump_sys_rmdir(filename);
	postcall(ukfs);
	return error;
}
    979   1.1     pooka 
/*
 * Run rump_sys_link(filename, f_create) between precall() and
 * postcall() and return its result.
 */
int
ukfs_link(struct ukfs *ukfs, const char *filename, const char *f_create)
{
	int error;

	precall(ukfs);
	error = rump_sys_link(filename, f_create);
	postcall(ukfs);
	return error;
}
    986   1.1     pooka 
/*
 * Run rump_sys_symlink(filename, linkname) between precall() and
 * postcall() and return its result.
 */
int
ukfs_symlink(struct ukfs *ukfs, const char *filename, const char *linkname)
{
	int error;

	precall(ukfs);
	error = rump_sys_symlink(filename, linkname);
	postcall(ukfs);
	return error;
}
    993   1.1     pooka 
/*
 * Run rump_sys_readlink(filename, linkbuf, buflen) between precall()
 * and postcall() and return its result.
 */
ssize_t
ukfs_readlink(struct ukfs *ukfs, const char *filename,
	char *linkbuf, size_t buflen)
{
	ssize_t linklen;

	precall(ukfs);
	linklen = rump_sys_readlink(filename, linkbuf, buflen);
	postcall(ukfs);

	return linklen;
}
   1005   1.1     pooka 
/*
 * Run rump_sys_rename(from, to) between precall() and postcall() and
 * return its result.
 */
int
ukfs_rename(struct ukfs *ukfs, const char *from, const char *to)
{
	int error;

	precall(ukfs);
	error = rump_sys_rename(from, to);
	postcall(ukfs);
	return error;
}
   1012   1.1     pooka 
   1013   1.1     pooka int
   1014   1.1     pooka ukfs_chdir(struct ukfs *ukfs, const char *path)
   1015   1.1     pooka {
   1016   1.1     pooka 	struct vnode *newvp, *oldvp;
   1017   1.1     pooka 	int rv;
   1018   1.1     pooka 
   1019   1.1     pooka 	precall(ukfs);
   1020  1.21     pooka 	rv = rump_sys_chdir(path);
   1021  1.21     pooka 	if (rv == -1)
   1022   1.1     pooka 		goto out;
   1023   1.1     pooka 
   1024  1.40     pooka 	newvp = rump_pub_cdir_get();
   1025   1.1     pooka 	pthread_spin_lock(&ukfs->ukfs_spin);
   1026   1.1     pooka 	oldvp = ukfs->ukfs_cdir;
   1027   1.1     pooka 	ukfs->ukfs_cdir = newvp;
   1028   1.1     pooka 	pthread_spin_unlock(&ukfs->ukfs_spin);
   1029   1.1     pooka 	if (oldvp)
   1030  1.40     pooka 		rump_pub_vp_rele(oldvp);
   1031   1.1     pooka 
   1032   1.1     pooka  out:
   1033   1.1     pooka 	postcall(ukfs);
   1034  1.21     pooka 	return rv;
   1035   1.1     pooka }
   1036   1.1     pooka 
/*
 * Run rump_sys_stat(filename, file_stat) between precall() and
 * postcall() and return its result.
 */
int
ukfs_stat(struct ukfs *ukfs, const char *filename, struct stat *file_stat)
{

	STDCALL(ukfs, rump_sys_stat(filename, file_stat));
}
   1048   1.1     pooka 
/*
 * Run rump_sys_lstat(filename, file_stat) between precall() and
 * postcall() and return its result.
 */
int
ukfs_lstat(struct ukfs *ukfs, const char *filename, struct stat *file_stat)
{

	STDCALL(ukfs, rump_sys_lstat(filename, file_stat));
}
   1060   1.1     pooka 
/*
 * Run rump_sys_chmod(filename, mode) between precall() and postcall()
 * and return its result.
 */
int
ukfs_chmod(struct ukfs *ukfs, const char *filename, mode_t mode)
{
	int error;

	precall(ukfs);
	error = rump_sys_chmod(filename, mode);
	postcall(ukfs);
	return error;
}
   1067   1.1     pooka 
/*
 * Run rump_sys_lchmod(filename, mode) between precall() and postcall()
 * and return its result.
 */
int
ukfs_lchmod(struct ukfs *ukfs, const char *filename, mode_t mode)
{
	int error;

	precall(ukfs);
	error = rump_sys_lchmod(filename, mode);
	postcall(ukfs);
	return error;
}
   1074   1.1     pooka 
/*
 * Run rump_sys_chown(filename, uid, gid) between precall() and
 * postcall() and return its result.
 */
int
ukfs_chown(struct ukfs *ukfs, const char *filename, uid_t uid, gid_t gid)
{
	int error;

	precall(ukfs);
	error = rump_sys_chown(filename, uid, gid);
	postcall(ukfs);
	return error;
}
   1081   1.1     pooka 
/*
 * Run rump_sys_lchown(filename, uid, gid) between precall() and
 * postcall() and return its result.
 */
int
ukfs_lchown(struct ukfs *ukfs, const char *filename, uid_t uid, gid_t gid)
{
	int error;

	precall(ukfs);
	error = rump_sys_lchown(filename, uid, gid);
	postcall(ukfs);
	return error;
}
   1088   1.1     pooka 
   1089   1.1     pooka int
   1090   1.1     pooka ukfs_chflags(struct ukfs *ukfs, const char *filename, u_long flags)
   1091   1.1     pooka {
   1092   1.1     pooka 
   1093  1.21     pooka 	STDCALL(ukfs, rump_sys_chflags(filename, flags));
   1094   1.1     pooka }
   1095   1.1     pooka 
   1096   1.1     pooka int
   1097   1.1     pooka ukfs_lchflags(struct ukfs *ukfs, const char *filename, u_long flags)
   1098   1.1     pooka {
   1099   1.1     pooka 
   1100  1.21     pooka 	STDCALL(ukfs, rump_sys_lchflags(filename, flags));
   1101   1.1     pooka }
   1102   1.1     pooka 
/*
 * Run rump_sys_utimes(filename, tptr) between precall() and postcall()
 * and return its result.
 */
int
ukfs_utimes(struct ukfs *ukfs, const char *filename, const struct timeval *tptr)
{
	int error;

	precall(ukfs);
	error = rump_sys_utimes(filename, tptr);
	postcall(ukfs);
	return error;
}
   1109   1.1     pooka 
/*
 * Run rump_sys_lutimes(filename, tptr) between precall() and postcall()
 * and return its result.
 */
int
ukfs_lutimes(struct ukfs *ukfs, const char *filename,
	      const struct timeval *tptr)
{
	int error;

	precall(ukfs);
	error = rump_sys_lutimes(filename, tptr);
	postcall(ukfs);
	return error;
}
   1117   1.1     pooka 
   1118   1.3     pooka /*
   1119   1.3     pooka  * Dynamic module support
   1120   1.3     pooka  */
   1121   1.3     pooka 
/*
 * Load one library.
 *
 * The library "fname" is dlopen()ed and, if it exports the
 * __start_link_set_modules/__stop_link_set_modules symbols, the modules
 * between them are handed to rump_pub_module_init().
 *
 * Returns:
 *	 1	modules were initialized
 *	 0	dlopen() failed with an "Undefined symbol" message; the
 *		caller may retry after loading other libraries
 *	-1	any other failure.  errno is set to the module init error,
 *		or to EINVAL if the link set symbols are missing; it is
 *		NOT set when dlopen() itself fails.
 *
 * XXX: the dlerror stuff isn't really threadsafe, but then again I
 * can't protect against other threads calling dl*() outside of ukfs,
 * so just live with it being flimsy
 */
int
ukfs_modload(const char *fname)
{
	void *handle;
	const struct modinfo *const *mi_start, *const *mi_end;
	int error;

	handle = dlopen(fname, RTLD_LAZY|RTLD_GLOBAL);
	if (handle == NULL) {
		const char *dlmsg = dlerror();

		/*
		 * dlerror() returns NULL if no error is pending (e.g.
		 * another thread consumed it); never pass that on to
		 * strstr() or a %s conversion.
		 */
		if (dlmsg == NULL)
			dlmsg = "unknown error";
		if (strstr(dlmsg, "Undefined symbol"))
			return 0;
		/* warnx() terminates the message with a newline itself */
		warnx("dlopen %s failed: %s", fname, dlmsg);
		/* XXXerrno */
		return -1;
	}

	mi_start = dlsym(handle, "__start_link_set_modules");
	mi_end = dlsym(handle, "__stop_link_set_modules");
	if (mi_start && mi_end) {
		error = rump_pub_module_init(mi_start,
		    (size_t)(mi_end-mi_start));
		if (error)
			goto errclose;
		return 1;
	}
	error = EINVAL;

 errclose:
	dlclose(handle);
	errno = error;
	return -1;
}
   1162   1.3     pooka 
/* a library whose load attempt reported unresolved symbols */
struct loadfail {
	char *pname;			/* malloc'd path of the library */

	LIST_ENTRY(loadfail) entries;
};

#define RUMPFSMOD_PREFIX "librumpfs_"
#define RUMPFSMOD_SUFFIX ".so"

/*
 * Return nonzero if "name" starts with RUMPFSMOD_PREFIX and ends with
 * RUMPFSMOD_SUFFIX.  The suffix is compared against the tail of the
 * name rather than against the first occurrence of the suffix string.
 */
static int
ukfs_isrumpfsmod(const char *name)
{
	const size_t preflen = strlen(RUMPFSMOD_PREFIX);
	const size_t sufflen = strlen(RUMPFSMOD_SUFFIX);
	const size_t namelen = strlen(name);

	if (namelen < preflen + sufflen)
		return 0;
	if (strncmp(name, RUMPFSMOD_PREFIX, preflen) != 0)
		return 0;
	return strcmp(name + namelen - sufflen, RUMPFSMOD_SUFFIX) == 0;
}

/*
 * Load every librumpfs_*.so library found in "dir".
 *
 * Libraries for which ukfs_modload() returns 0 (unresolved symbols) are
 * remembered and retried for as long as a retry round manages to load
 * at least one more of them.  Other load failures are ignored.
 *
 * Returns the number of libraries loaded.  Returns -1 if the directory
 * cannot be opened, or if scanning failed (readdir error or out of
 * memory) and nothing was loaded; in the latter case errno is set to
 * the scan error.
 */
int
ukfs_modload_dir(const char *dir)
{
	char nbuf[MAXPATHLEN+1];
	struct dirent entry, *result;
	DIR *libdir;
	struct loadfail *lf, *nlf;
	int error, nloaded = 0, redo, rv;
	LIST_HEAD(, loadfail) lfs;

	libdir = opendir(dir);
	if (libdir == NULL)
		return -1;

	LIST_INIT(&lfs);
	for (;;) {
		if ((error = readdir_r(libdir, &entry, &result)) != 0)
			break;
		if (!result)
			break;
		if (!ukfs_isrumpfsmod(result->d_name))
			continue;

		strlcpy(nbuf, dir, sizeof(nbuf));
		strlcat(nbuf, "/", sizeof(nbuf));
		/* a truncated path would name some other file: skip it */
		if (strlcat(nbuf, result->d_name, sizeof(nbuf))
		    >= sizeof(nbuf))
			continue;

		rv = ukfs_modload(nbuf);
		if (rv == 1) {
			nloaded++;
			continue;
		}
		if (rv != 0)
			continue;	/* ignore errors */

		/* unresolved symbols: queue for the retry rounds below */
		lf = malloc(sizeof(*lf));
		if (lf == NULL) {
			error = ENOMEM;
			break;		/* stop scanning, keep the error */
		}
		lf->pname = strdup(nbuf);
		if (lf->pname == NULL) {
			free(lf);
			error = ENOMEM;
			break;		/* stop scanning, keep the error */
		}
		LIST_INSERT_HEAD(&lfs, lf, entries);
	}
	closedir(libdir);
	if (error && nloaded != 0)
		error = 0;

	/*
	 * El-cheapo dependency calculator.  Just try to load the
	 * modules n times in a loop
	 */
	for (redo = 1; redo;) {
		redo = 0;
		nlf = LIST_FIRST(&lfs);
		while ((lf = nlf) != NULL) {
			nlf = LIST_NEXT(lf, entries);
			if (ukfs_modload(lf->pname) == 1) {
				nloaded++;
				redo = 1;
				LIST_REMOVE(lf, entries);
				free(lf->pname);
				free(lf);
			}
		}
	}

	/* whatever is still queued could not be loaded: drop it */
	while ((lf = LIST_FIRST(&lfs)) != NULL) {
		LIST_REMOVE(lf, entries);
		free(lf->pname);
		free(lf);
	}

	if (error && nloaded == 0) {
		errno = error;
		return -1;
	}

	return nloaded;
}
   1260   1.3     pooka 
   1261   1.4     pooka /* XXX: this code uses definitions from NetBSD, needs rumpdefs */
   1262   1.4     pooka ssize_t
   1263   1.4     pooka ukfs_vfstypes(char *buf, size_t buflen)
   1264   1.4     pooka {
   1265   1.4     pooka 	int mib[3];
   1266   1.4     pooka 	struct sysctlnode q, ans[128];
   1267   1.4     pooka 	size_t alen;
   1268  1.21     pooka 	int i;
   1269   1.4     pooka 
   1270   1.4     pooka 	mib[0] = CTL_VFS;
   1271   1.4     pooka 	mib[1] = VFS_GENERIC;
   1272   1.4     pooka 	mib[2] = CTL_QUERY;
   1273   1.4     pooka 	alen = sizeof(ans);
   1274   1.4     pooka 
   1275   1.4     pooka 	memset(&q, 0, sizeof(q));
   1276   1.4     pooka 	q.sysctl_flags = SYSCTL_VERSION;
   1277   1.4     pooka 
   1278  1.21     pooka 	if (rump_sys___sysctl(mib, 3, ans, &alen, &q, sizeof(q)) == -1) {
   1279   1.4     pooka 		return -1;
   1280   1.4     pooka 	}
   1281   1.4     pooka 
   1282   1.4     pooka 	for (i = 0; i < alen/sizeof(ans[0]); i++)
   1283   1.4     pooka 		if (strcmp("fstypes", ans[i].sysctl_name) == 0)
   1284   1.4     pooka 			break;
   1285   1.4     pooka 	if (i == alen/sizeof(ans[0])) {
   1286   1.4     pooka 		errno = ENXIO;
   1287   1.4     pooka 		return -1;
   1288   1.4     pooka 	}
   1289   1.4     pooka 
   1290   1.4     pooka 	mib[0] = CTL_VFS;
   1291   1.4     pooka 	mib[1] = VFS_GENERIC;
   1292   1.4     pooka 	mib[2] = ans[i].sysctl_num;
   1293   1.4     pooka 
   1294  1.21     pooka 	if (rump_sys___sysctl(mib, 3, buf, &buflen, NULL, 0) == -1) {
   1295   1.4     pooka 		return -1;
   1296   1.4     pooka 	}
   1297   1.4     pooka 
   1298   1.4     pooka 	return buflen;
   1299   1.4     pooka }
   1300   1.3     pooka 
   1301   1.3     pooka /*
   1302   1.3     pooka  * Utilities
   1303   1.3     pooka  */
/*
 * Create every directory along "pathname", one component at a time,
 * by calling mkdirfn(fs, prefix, mode & ~umask) for each successively
 * longer prefix of the path.
 *
 * A component that already exists (mkdirfn fails with EEXIST) is not an
 * error.  Returns the result of the last mkdirfn call: -1 (errno set by
 * mkdirfn) as soon as a component cannot be created.  Also returns -1
 * with errno ENOMEM if the path cannot be duplicated.
 */
static int
builddirs(const char *pathname, mode_t mode,
	int (*mkdirfn)(struct ukfs *, const char *, mode_t), struct ukfs *fs)
{
	char *path, *sep;
	int rv;
	mode_t mask;
	bool last;

	/* fetch the process umask; it can only be read by setting it */
	/*ukfs_umask((mask = ukfs_umask(0)));*/
	mask = umask(0);
	umask(mask);

	path = strdup(pathname);
	if (path == NULL) {
		errno = ENOMEM;
		return -1;
	}

	sep = path;
	do {
		/* advance to the end of the next component */
		sep += strspn(sep, "/");
		sep += strcspn(sep, "/");
		last = (*sep == '\0');
		*sep = '\0';		/* temporarily cut the path here */

		rv = mkdirfn(fs, path, mode & ~mask);
		/* errno is meaningful only if the call actually failed */
		if (rv == -1 && errno == EEXIST)
			rv = 0;

		if (!last)
			*sep = '/';	/* restore the separator */
	} while (rv != -1 && !last);

	free(path);

	return rv;
}
   1346  1.30     pooka 
   1347  1.30     pooka int
   1348  1.30     pooka ukfs_util_builddirs(struct ukfs *ukfs, const char *pathname, mode_t mode)
   1349  1.30     pooka {
   1350  1.30     pooka 
   1351  1.30     pooka 	return builddirs(pathname, mode, ukfs_mkdir, ukfs);
   1352  1.30     pooka }
   1353