Home | History | Annotate | Line # | Download | only in kern
sys_descrip.c revision 1.27.2.3
      1  1.27.2.2       tls /*	$NetBSD: sys_descrip.c,v 1.27.2.3 2017/12/03 11:38:45 jdolecek Exp $	*/
      2       1.1        ad 
      3       1.1        ad /*-
      4       1.1        ad  * Copyright (c) 2008 The NetBSD Foundation, Inc.
      5       1.1        ad  * All rights reserved.
      6       1.1        ad  *
      7       1.1        ad  * Redistribution and use in source and binary forms, with or without
      8       1.1        ad  * modification, are permitted provided that the following conditions
      9       1.1        ad  * are met:
     10       1.1        ad  * 1. Redistributions of source code must retain the above copyright
     11       1.1        ad  *    notice, this list of conditions and the following disclaimer.
     12       1.1        ad  * 2. Redistributions in binary form must reproduce the above copyright
     13       1.1        ad  *    notice, this list of conditions and the following disclaimer in the
     14       1.1        ad  *    documentation and/or other materials provided with the distribution.
     15       1.1        ad  *
     16       1.1        ad  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     17       1.1        ad  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     18       1.1        ad  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     19       1.1        ad  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     20       1.1        ad  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     21       1.1        ad  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     22       1.1        ad  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     23       1.1        ad  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     24       1.1        ad  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     25       1.1        ad  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     26       1.1        ad  * POSSIBILITY OF SUCH DAMAGE.
     27       1.1        ad  */
     28       1.1        ad 
     29       1.1        ad /*
     30       1.1        ad  * Copyright (c) 1982, 1986, 1989, 1991, 1993
     31       1.1        ad  *	The Regents of the University of California.  All rights reserved.
     32       1.1        ad  * (c) UNIX System Laboratories, Inc.
     33       1.1        ad  * All or some portions of this file are derived from material licensed
     34       1.1        ad  * to the University of California by American Telephone and Telegraph
     35       1.1        ad  * Co. or Unix System Laboratories, Inc. and are reproduced herein with
     36       1.1        ad  * the permission of UNIX System Laboratories, Inc.
     37       1.1        ad  *
     38       1.1        ad  * Redistribution and use in source and binary forms, with or without
     39       1.1        ad  * modification, are permitted provided that the following conditions
     40       1.1        ad  * are met:
     41       1.1        ad  * 1. Redistributions of source code must retain the above copyright
     42       1.1        ad  *    notice, this list of conditions and the following disclaimer.
     43       1.1        ad  * 2. Redistributions in binary form must reproduce the above copyright
     44       1.1        ad  *    notice, this list of conditions and the following disclaimer in the
     45       1.1        ad  *    documentation and/or other materials provided with the distribution.
     46       1.1        ad  * 3. Neither the name of the University nor the names of its contributors
     47       1.1        ad  *    may be used to endorse or promote products derived from this software
     48       1.1        ad  *    without specific prior written permission.
     49       1.1        ad  *
     50       1.1        ad  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     51       1.1        ad  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     52       1.1        ad  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     53       1.1        ad  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     54       1.1        ad  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     55       1.1        ad  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     56       1.1        ad  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     57       1.1        ad  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     58       1.1        ad  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     59       1.1        ad  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     60       1.1        ad  * SUCH DAMAGE.
     61       1.1        ad  *
     62       1.1        ad  *	@(#)kern_descrip.c	8.8 (Berkeley) 2/14/95
     63       1.1        ad  */
     64       1.1        ad 
     65       1.1        ad /*
     66       1.1        ad  * System calls on descriptors.
     67       1.1        ad  */
     68       1.1        ad 
     69       1.1        ad #include <sys/cdefs.h>
     70  1.27.2.2       tls __KERNEL_RCSID(0, "$NetBSD: sys_descrip.c,v 1.27.2.3 2017/12/03 11:38:45 jdolecek Exp $");
     71       1.1        ad 
     72       1.1        ad #include <sys/param.h>
     73       1.1        ad #include <sys/systm.h>
     74       1.1        ad #include <sys/filedesc.h>
     75       1.1        ad #include <sys/kernel.h>
     76       1.1        ad #include <sys/vnode.h>
     77       1.1        ad #include <sys/proc.h>
     78       1.1        ad #include <sys/file.h>
     79       1.1        ad #include <sys/namei.h>
     80       1.1        ad #include <sys/socket.h>
     81       1.1        ad #include <sys/socketvar.h>
     82       1.1        ad #include <sys/stat.h>
     83       1.1        ad #include <sys/ioctl.h>
     84       1.1        ad #include <sys/fcntl.h>
     85      1.10      yamt #include <sys/kmem.h>
     86       1.1        ad #include <sys/pool.h>
     87       1.1        ad #include <sys/syslog.h>
     88       1.1        ad #include <sys/unistd.h>
     89       1.1        ad #include <sys/resourcevar.h>
     90       1.1        ad #include <sys/conf.h>
     91       1.1        ad #include <sys/event.h>
     92       1.1        ad #include <sys/kauth.h>
     93       1.1        ad #include <sys/atomic.h>
     94       1.1        ad #include <sys/mount.h>
     95       1.1        ad #include <sys/syscallargs.h>
     96       1.1        ad 
     97      1.15      yamt #include <uvm/uvm_readahead.h>
     98      1.15      yamt 
     99       1.1        ad /*
    100       1.1        ad  * Duplicate a file descriptor.
    101       1.1        ad  */
    102       1.1        ad int
    103       1.1        ad sys_dup(struct lwp *l, const struct sys_dup_args *uap, register_t *retval)
    104       1.1        ad {
    105       1.1        ad 	/* {
    106       1.1        ad 		syscallarg(int)	fd;
    107       1.1        ad 	} */
    108  1.27.2.3  jdolecek 	int error, newfd, oldfd;
    109       1.1        ad 	file_t *fp;
    110       1.1        ad 
    111  1.27.2.3  jdolecek 	oldfd = SCARG(uap, fd);
    112       1.1        ad 
    113  1.27.2.3  jdolecek 	if ((fp = fd_getfile(oldfd)) == NULL) {
    114       1.1        ad 		return EBADF;
    115       1.1        ad 	}
    116  1.27.2.3  jdolecek 	error = fd_dup(fp, 0, &newfd, false);
    117  1.27.2.3  jdolecek 	fd_putfile(oldfd);
    118  1.27.2.3  jdolecek 	*retval = newfd;
    119       1.1        ad 	return error;
    120       1.1        ad }
    121       1.1        ad 
    122       1.1        ad /*
    123       1.1        ad  * Duplicate a file descriptor to a particular value.
    124       1.1        ad  */
    125      1.26    martin int
    126      1.22  christos dodup(struct lwp *l, int from, int to, int flags, register_t *retval)
    127       1.1        ad {
    128      1.22  christos 	int error;
    129       1.1        ad 	file_t *fp;
    130       1.1        ad 
    131      1.22  christos 	if ((fp = fd_getfile(from)) == NULL)
    132       1.1        ad 		return EBADF;
    133       1.8        ad 	mutex_enter(&fp->f_lock);
    134       1.8        ad 	fp->f_count++;
    135       1.8        ad 	mutex_exit(&fp->f_lock);
    136      1.22  christos 	fd_putfile(from);
    137       1.8        ad 
    138      1.22  christos 	if ((u_int)to >= curproc->p_rlimit[RLIMIT_NOFILE].rlim_cur ||
    139      1.22  christos 	    (u_int)to >= maxfiles)
    140       1.1        ad 		error = EBADF;
    141      1.22  christos 	else if (from == to)
    142       1.1        ad 		error = 0;
    143      1.22  christos 	else
    144      1.22  christos 		error = fd_dup2(fp, to, flags);
    145       1.8        ad 	closef(fp);
    146      1.22  christos 	*retval = to;
    147       1.1        ad 
    148       1.6     njoly 	return error;
    149       1.1        ad }
    150       1.1        ad 
    151      1.22  christos int
    152      1.22  christos sys_dup3(struct lwp *l, const struct sys_dup3_args *uap, register_t *retval)
    153      1.22  christos {
    154      1.22  christos 	/* {
    155      1.22  christos 		syscallarg(int)	from;
    156      1.22  christos 		syscallarg(int)	to;
    157      1.22  christos 		syscallarg(int)	flags;
    158      1.22  christos 	} */
    159      1.22  christos 	return dodup(l, SCARG(uap, from), SCARG(uap, to), SCARG(uap, flags),
    160      1.22  christos 	    retval);
    161      1.22  christos }
    162      1.22  christos 
    163      1.22  christos int
    164      1.22  christos sys_dup2(struct lwp *l, const struct sys_dup2_args *uap, register_t *retval)
    165      1.22  christos {
    166      1.22  christos 	/* {
    167      1.22  christos 		syscallarg(int)	from;
    168      1.22  christos 		syscallarg(int)	to;
    169      1.22  christos 	} */
    170      1.22  christos 	return dodup(l, SCARG(uap, from), SCARG(uap, to), 0, retval);
    171      1.22  christos }
    172      1.22  christos 
    173       1.1        ad /*
    174       1.1        ad  * fcntl call which is being passed to the file's fs.
    175       1.1        ad  */
    176       1.1        ad static int
    177       1.1        ad fcntl_forfs(int fd, file_t *fp, int cmd, void *arg)
    178       1.1        ad {
    179       1.1        ad 	int		error;
    180       1.1        ad 	u_int		size;
    181       1.1        ad 	void		*data, *memp;
    182       1.1        ad #define STK_PARAMS	128
    183       1.1        ad 	char		stkbuf[STK_PARAMS];
    184       1.1        ad 
    185       1.1        ad 	if ((fp->f_flag & (FREAD | FWRITE)) == 0)
    186       1.1        ad 		return (EBADF);
    187       1.1        ad 
    188       1.1        ad 	/*
    189       1.1        ad 	 * Interpret high order word to find amount of data to be
    190       1.1        ad 	 * copied to/from the user's address space.
    191       1.1        ad 	 */
    192       1.1        ad 	size = (size_t)F_PARAM_LEN(cmd);
    193       1.1        ad 	if (size > F_PARAM_MAX)
    194       1.1        ad 		return (EINVAL);
    195       1.1        ad 	memp = NULL;
    196       1.1        ad 	if (size > sizeof(stkbuf)) {
    197       1.1        ad 		memp = kmem_alloc(size, KM_SLEEP);
    198       1.1        ad 		data = memp;
    199       1.1        ad 	} else
    200       1.1        ad 		data = stkbuf;
    201       1.1        ad 	if (cmd & F_FSIN) {
    202       1.1        ad 		if (size) {
    203       1.1        ad 			error = copyin(arg, data, size);
    204       1.1        ad 			if (error) {
    205       1.1        ad 				if (memp)
    206       1.1        ad 					kmem_free(memp, size);
    207       1.1        ad 				return (error);
    208       1.1        ad 			}
    209       1.1        ad 		} else
    210       1.1        ad 			*(void **)data = arg;
    211       1.1        ad 	} else if ((cmd & F_FSOUT) != 0 && size != 0) {
    212       1.1        ad 		/*
    213       1.1        ad 		 * Zero the buffer so the user always
    214       1.1        ad 		 * gets back something deterministic.
    215       1.1        ad 		 */
    216       1.1        ad 		memset(data, 0, size);
    217       1.1        ad 	} else if (cmd & F_FSVOID)
    218       1.1        ad 		*(void **)data = arg;
    219       1.1        ad 
    220       1.1        ad 
    221       1.1        ad 	error = (*fp->f_ops->fo_fcntl)(fp, cmd, data);
    222       1.1        ad 
    223       1.1        ad 	/*
    224       1.1        ad 	 * Copy any data to user, size was
    225       1.1        ad 	 * already set and checked above.
    226       1.1        ad 	 */
    227       1.1        ad 	if (error == 0 && (cmd & F_FSOUT) && size)
    228       1.1        ad 		error = copyout(data, arg, size);
    229       1.1        ad 	if (memp)
    230       1.1        ad 		kmem_free(memp, size);
    231       1.1        ad 	return (error);
    232       1.1        ad }
    233       1.1        ad 
    234       1.1        ad int
    235       1.1        ad do_fcntl_lock(int fd, int cmd, struct flock *fl)
    236       1.1        ad {
    237       1.1        ad 	file_t *fp;
    238       1.1        ad 	vnode_t *vp;
    239       1.1        ad 	proc_t *p;
    240       1.1        ad 	int error, flg;
    241       1.1        ad 
    242       1.1        ad 	if ((fp = fd_getfile(fd)) == NULL)
    243       1.1        ad 		return EBADF;
    244       1.1        ad 	if (fp->f_type != DTYPE_VNODE) {
    245       1.1        ad 		fd_putfile(fd);
    246       1.1        ad 		return EINVAL;
    247       1.1        ad 	}
    248  1.27.2.3  jdolecek 	vp = fp->f_vnode;
    249       1.1        ad 	if (fl->l_whence == SEEK_CUR)
    250       1.1        ad 		fl->l_start += fp->f_offset;
    251       1.1        ad 
    252       1.1        ad 	flg = F_POSIX;
    253       1.1        ad 	p = curproc;
    254       1.1        ad 
    255       1.1        ad 	switch (cmd) {
    256       1.1        ad 	case F_SETLKW:
    257       1.1        ad 		flg |= F_WAIT;
    258       1.1        ad 		/* Fall into F_SETLK */
    259       1.1        ad 
    260       1.1        ad 	case F_SETLK:
    261       1.1        ad 		switch (fl->l_type) {
    262       1.1        ad 		case F_RDLCK:
    263       1.1        ad 			if ((fp->f_flag & FREAD) == 0) {
    264       1.1        ad 				error = EBADF;
    265       1.1        ad 				break;
    266       1.1        ad 			}
    267       1.1        ad 			if ((p->p_flag & PK_ADVLOCK) == 0) {
    268       1.2        ad 				mutex_enter(p->p_lock);
    269       1.1        ad 				p->p_flag |= PK_ADVLOCK;
    270       1.2        ad 				mutex_exit(p->p_lock);
    271       1.1        ad 			}
    272       1.1        ad 			error = VOP_ADVLOCK(vp, p, F_SETLK, fl, flg);
    273       1.1        ad 			break;
    274       1.1        ad 
    275       1.1        ad 		case F_WRLCK:
    276       1.1        ad 			if ((fp->f_flag & FWRITE) == 0) {
    277       1.1        ad 				error = EBADF;
    278       1.1        ad 				break;
    279       1.1        ad 			}
    280       1.1        ad 			if ((p->p_flag & PK_ADVLOCK) == 0) {
    281       1.2        ad 				mutex_enter(p->p_lock);
    282       1.1        ad 				p->p_flag |= PK_ADVLOCK;
    283       1.2        ad 				mutex_exit(p->p_lock);
    284       1.1        ad 			}
    285       1.1        ad 			error = VOP_ADVLOCK(vp, p, F_SETLK, fl, flg);
    286       1.1        ad 			break;
    287       1.1        ad 
    288       1.1        ad 		case F_UNLCK:
    289       1.1        ad 			error = VOP_ADVLOCK(vp, p, F_UNLCK, fl, F_POSIX);
    290       1.1        ad 			break;
    291       1.1        ad 
    292       1.1        ad 		default:
    293       1.1        ad 			error = EINVAL;
    294       1.1        ad 			break;
    295       1.1        ad 		}
    296       1.1        ad 		break;
    297       1.1        ad 
    298       1.1        ad 	case F_GETLK:
    299       1.1        ad 		if (fl->l_type != F_RDLCK &&
    300       1.1        ad 		    fl->l_type != F_WRLCK &&
    301       1.1        ad 		    fl->l_type != F_UNLCK) {
    302       1.1        ad 			error = EINVAL;
    303       1.1        ad 			break;
    304       1.1        ad 		}
    305       1.1        ad 		error = VOP_ADVLOCK(vp, p, F_GETLK, fl, F_POSIX);
    306       1.1        ad 		break;
    307       1.1        ad 
    308       1.1        ad 	default:
    309       1.1        ad 		error = EINVAL;
    310       1.1        ad 		break;
    311       1.1        ad 	}
    312       1.1        ad 
    313       1.1        ad 	fd_putfile(fd);
    314       1.1        ad 	return error;
    315       1.1        ad }
    316       1.1        ad 
    317       1.1        ad /*
    318       1.1        ad  * The file control system call.
    319       1.1        ad  */
    320       1.1        ad int
    321       1.1        ad sys_fcntl(struct lwp *l, const struct sys_fcntl_args *uap, register_t *retval)
    322       1.1        ad {
    323       1.1        ad 	/* {
    324       1.1        ad 		syscallarg(int)		fd;
    325       1.1        ad 		syscallarg(int)		cmd;
    326       1.1        ad 		syscallarg(void *)	arg;
    327       1.1        ad 	} */
    328       1.1        ad 	int fd, i, tmp, error, cmd, newmin;
    329       1.1        ad 	filedesc_t *fdp;
    330       1.1        ad 	file_t *fp;
    331       1.1        ad 	struct flock fl;
    332      1.22  christos 	bool cloexec = false;
    333       1.1        ad 
    334       1.1        ad 	fd = SCARG(uap, fd);
    335       1.1        ad 	cmd = SCARG(uap, cmd);
    336       1.4        ad 	fdp = l->l_fd;
    337       1.1        ad 	error = 0;
    338       1.1        ad 
    339       1.1        ad 	switch (cmd) {
    340       1.1        ad 	case F_CLOSEM:
    341       1.1        ad 		if (fd < 0)
    342       1.1        ad 			return EBADF;
    343       1.1        ad 		while ((i = fdp->fd_lastfile) >= fd) {
    344       1.1        ad 			if (fd_getfile(i) == NULL) {
    345       1.1        ad 				/* Another thread has updated. */
    346       1.1        ad 				continue;
    347       1.1        ad 			}
    348       1.1        ad 			fd_close(i);
    349       1.1        ad 		}
    350       1.1        ad 		return 0;
    351       1.1        ad 
    352       1.1        ad 	case F_MAXFD:
    353       1.1        ad 		*retval = fdp->fd_lastfile;
    354       1.1        ad 		return 0;
    355       1.1        ad 
    356       1.1        ad 	case F_SETLKW:
    357       1.1        ad 	case F_SETLK:
    358       1.1        ad 	case F_GETLK:
    359       1.1        ad 		error = copyin(SCARG(uap, arg), &fl, sizeof(fl));
    360       1.1        ad 		if (error)
    361       1.1        ad 			return error;
    362       1.1        ad 		error = do_fcntl_lock(fd, cmd, &fl);
    363       1.1        ad 		if (cmd == F_GETLK && error == 0)
    364       1.1        ad 			error = copyout(&fl, SCARG(uap, arg), sizeof(fl));
    365       1.1        ad 		return error;
    366       1.1        ad 
    367       1.1        ad 	default:
    368       1.1        ad 		/* Handled below */
    369       1.1        ad 		break;
    370       1.1        ad 	}
    371       1.1        ad 
    372       1.1        ad 	if ((fp = fd_getfile(fd)) == NULL)
    373       1.1        ad 		return (EBADF);
    374       1.1        ad 
    375       1.1        ad 	if ((cmd & F_FSCTL)) {
    376       1.1        ad 		error = fcntl_forfs(fd, fp, cmd, SCARG(uap, arg));
    377       1.1        ad 		fd_putfile(fd);
    378       1.1        ad 		return error;
    379       1.1        ad 	}
    380       1.1        ad 
    381       1.1        ad 	switch (cmd) {
    382      1.22  christos 	case F_DUPFD_CLOEXEC:
    383      1.22  christos 		cloexec = true;
    384      1.22  christos 		/*FALLTHROUGH*/
    385       1.1        ad 	case F_DUPFD:
    386       1.1        ad 		newmin = (long)SCARG(uap, arg);
    387       1.4        ad 		if ((u_int)newmin >=
    388       1.4        ad 		    l->l_proc->p_rlimit[RLIMIT_NOFILE].rlim_cur ||
    389       1.1        ad 		    (u_int)newmin >= maxfiles) {
    390       1.1        ad 			fd_putfile(fd);
    391       1.1        ad 			return EINVAL;
    392       1.1        ad 		}
    393      1.22  christos 		error = fd_dup(fp, newmin, &i, cloexec);
    394       1.1        ad 		*retval = i;
    395       1.1        ad 		break;
    396       1.1        ad 
    397       1.1        ad 	case F_GETFD:
    398      1.20  christos 		*retval = fdp->fd_dt->dt_ff[fd]->ff_exclose;
    399       1.1        ad 		break;
    400       1.1        ad 
    401       1.1        ad 	case F_SETFD:
    402      1.20  christos 		fd_set_exclose(l, fd,
    403      1.20  christos 		    ((long)SCARG(uap, arg) & FD_CLOEXEC) != 0);
    404       1.1        ad 		break;
    405       1.1        ad 
    406      1.24  christos 	case F_GETNOSIGPIPE:
    407      1.24  christos 		*retval = (fp->f_flag & FNOSIGPIPE) != 0;
    408      1.24  christos 		break;
    409      1.24  christos 
    410      1.24  christos 	case F_SETNOSIGPIPE:
    411      1.24  christos 		if (SCARG(uap, arg))
    412      1.25  christos 			atomic_or_uint(&fp->f_flag, FNOSIGPIPE);
    413      1.24  christos 		else
    414      1.25  christos 			atomic_and_uint(&fp->f_flag, ~FNOSIGPIPE);
    415      1.24  christos 		*retval = 0;
    416      1.24  christos 		break;
    417      1.24  christos 
    418       1.1        ad 	case F_GETFL:
    419       1.1        ad 		*retval = OFLAGS(fp->f_flag);
    420       1.1        ad 		break;
    421       1.1        ad 
    422       1.1        ad 	case F_SETFL:
    423       1.1        ad 		/* XXX not guaranteed to be atomic. */
    424       1.1        ad 		tmp = FFLAGS((long)SCARG(uap, arg)) & FCNTLFLAGS;
    425       1.1        ad 		error = (*fp->f_ops->fo_fcntl)(fp, F_SETFL, &tmp);
    426       1.1        ad 		if (error)
    427       1.1        ad 			break;
    428       1.1        ad 		i = tmp ^ fp->f_flag;
    429       1.1        ad 		if (i & FNONBLOCK) {
    430       1.1        ad 			int flgs = tmp & FNONBLOCK;
    431       1.1        ad 			error = (*fp->f_ops->fo_ioctl)(fp, FIONBIO, &flgs);
    432       1.1        ad 			if (error) {
    433       1.1        ad 				(*fp->f_ops->fo_fcntl)(fp, F_SETFL,
    434       1.1        ad 				    &fp->f_flag);
    435       1.1        ad 				break;
    436       1.1        ad 			}
    437       1.1        ad 		}
    438       1.1        ad 		if (i & FASYNC) {
    439       1.1        ad 			int flgs = tmp & FASYNC;
    440       1.1        ad 			error = (*fp->f_ops->fo_ioctl)(fp, FIOASYNC, &flgs);
    441       1.1        ad 			if (error) {
    442       1.1        ad 				if (i & FNONBLOCK) {
    443       1.1        ad 					tmp = fp->f_flag & FNONBLOCK;
    444       1.1        ad 					(void)(*fp->f_ops->fo_ioctl)(fp,
    445       1.1        ad 						FIONBIO, &tmp);
    446       1.1        ad 				}
    447       1.1        ad 				(*fp->f_ops->fo_fcntl)(fp, F_SETFL,
    448       1.1        ad 				    &fp->f_flag);
    449       1.1        ad 				break;
    450       1.1        ad 			}
    451       1.1        ad 		}
    452       1.1        ad 		fp->f_flag = (fp->f_flag & ~FCNTLFLAGS) | tmp;
    453       1.1        ad 		break;
    454       1.1        ad 
    455       1.1        ad 	case F_GETOWN:
    456       1.1        ad 		error = (*fp->f_ops->fo_ioctl)(fp, FIOGETOWN, &tmp);
    457       1.1        ad 		*retval = tmp;
    458       1.1        ad 		break;
    459       1.1        ad 
    460       1.1        ad 	case F_SETOWN:
    461       1.7     rmind 		tmp = (int)(uintptr_t) SCARG(uap, arg);
    462       1.1        ad 		error = (*fp->f_ops->fo_ioctl)(fp, FIOSETOWN, &tmp);
    463       1.1        ad 		break;
    464       1.1        ad 
    465       1.1        ad 	default:
    466       1.1        ad 		error = EINVAL;
    467       1.1        ad 	}
    468       1.1        ad 
    469       1.1        ad 	fd_putfile(fd);
    470       1.1        ad 	return (error);
    471       1.1        ad }
    472       1.1        ad 
    473       1.1        ad /*
    474       1.1        ad  * Close a file descriptor.
    475       1.1        ad  */
    476       1.1        ad int
    477       1.1        ad sys_close(struct lwp *l, const struct sys_close_args *uap, register_t *retval)
    478       1.1        ad {
    479       1.1        ad 	/* {
    480       1.1        ad 		syscallarg(int)	fd;
    481       1.1        ad 	} */
    482      1.27  riastrad 	int error;
    483       1.1        ad 
    484       1.1        ad 	if (fd_getfile(SCARG(uap, fd)) == NULL) {
    485       1.1        ad 		return EBADF;
    486       1.1        ad 	}
    487      1.27  riastrad 
    488      1.27  riastrad 	error = fd_close(SCARG(uap, fd));
    489      1.27  riastrad 	if (error == ERESTART) {
    490      1.27  riastrad #ifdef DIAGNOSTIC
    491      1.27  riastrad 		printf("pid %d: close returned ERESTART\n",
    492      1.27  riastrad 		    (int)l->l_proc->p_pid);
    493      1.27  riastrad #endif
    494      1.27  riastrad 		error = EINTR;
    495      1.27  riastrad 	}
    496      1.27  riastrad 
    497      1.27  riastrad 	return error;
    498       1.1        ad }
    499       1.1        ad 
    500       1.1        ad /*
    501       1.1        ad  * Return status information about a file descriptor.
    502       1.1        ad  * Common function for compat code.
    503       1.1        ad  */
    504       1.1        ad int
    505       1.1        ad do_sys_fstat(int fd, struct stat *sb)
    506       1.1        ad {
    507       1.1        ad 	file_t *fp;
    508       1.1        ad 	int error;
    509       1.1        ad 
    510       1.1        ad 	if ((fp = fd_getfile(fd)) == NULL) {
    511       1.1        ad 		return EBADF;
    512       1.1        ad 	}
    513       1.1        ad 	error = (*fp->f_ops->fo_stat)(fp, sb);
    514       1.1        ad 	fd_putfile(fd);
    515       1.1        ad 
    516       1.1        ad 	return error;
    517       1.1        ad }
    518       1.1        ad 
    519       1.1        ad /*
    520       1.1        ad  * Return status information about a file descriptor.
    521       1.1        ad  */
    522       1.1        ad int
    523       1.9  christos sys___fstat50(struct lwp *l, const struct sys___fstat50_args *uap,
    524       1.1        ad 	      register_t *retval)
    525       1.1        ad {
    526       1.1        ad 	/* {
    527       1.1        ad 		syscallarg(int)			fd;
    528       1.1        ad 		syscallarg(struct stat *)	sb;
    529       1.1        ad 	} */
    530       1.1        ad 	struct stat sb;
    531       1.1        ad 	int error;
    532       1.1        ad 
    533       1.1        ad 	error = do_sys_fstat(SCARG(uap, fd), &sb);
    534       1.1        ad 	if (error == 0) {
    535       1.1        ad 		error = copyout(&sb, SCARG(uap, sb), sizeof(sb));
    536       1.1        ad 	}
    537       1.1        ad 	return error;
    538       1.1        ad }
    539       1.1        ad 
    540       1.1        ad /*
    541       1.1        ad  * Return pathconf information about a file descriptor.
    542       1.1        ad  */
    543       1.1        ad int
    544       1.1        ad sys_fpathconf(struct lwp *l, const struct sys_fpathconf_args *uap,
    545       1.1        ad 	      register_t *retval)
    546       1.1        ad {
    547       1.1        ad 	/* {
    548       1.1        ad 		syscallarg(int)	fd;
    549       1.1        ad 		syscallarg(int)	name;
    550       1.1        ad 	} */
    551       1.1        ad 	int fd, error;
    552       1.1        ad 	file_t *fp;
    553       1.1        ad 
    554       1.1        ad 	fd = SCARG(uap, fd);
    555       1.1        ad 	error = 0;
    556       1.1        ad 
    557       1.1        ad 	if ((fp = fd_getfile(fd)) == NULL) {
    558       1.1        ad 		return (EBADF);
    559       1.1        ad 	}
    560       1.1        ad 	switch (fp->f_type) {
    561       1.1        ad 	case DTYPE_SOCKET:
    562       1.1        ad 	case DTYPE_PIPE:
    563       1.1        ad 		if (SCARG(uap, name) != _PC_PIPE_BUF)
    564       1.1        ad 			error = EINVAL;
    565       1.1        ad 		else
    566       1.1        ad 			*retval = PIPE_BUF;
    567       1.1        ad 		break;
    568       1.1        ad 
    569       1.1        ad 	case DTYPE_VNODE:
    570  1.27.2.3  jdolecek 		error = VOP_PATHCONF(fp->f_vnode, SCARG(uap, name), retval);
    571       1.1        ad 		break;
    572       1.1        ad 
    573       1.1        ad 	case DTYPE_KQUEUE:
    574       1.1        ad 		error = EINVAL;
    575       1.1        ad 		break;
    576       1.1        ad 
    577       1.1        ad 	default:
    578       1.1        ad 		error = EOPNOTSUPP;
    579       1.1        ad 		break;
    580       1.1        ad 	}
    581       1.1        ad 
    582       1.1        ad 	fd_putfile(fd);
    583       1.1        ad 	return (error);
    584       1.1        ad }
    585       1.1        ad 
    586       1.1        ad /*
    587       1.1        ad  * Apply an advisory lock on a file descriptor.
    588       1.1        ad  *
    589       1.1        ad  * Just attempt to get a record lock of the requested type on
    590       1.1        ad  * the entire file (l_whence = SEEK_SET, l_start = 0, l_len = 0).
    591       1.1        ad  */
    592       1.1        ad /* ARGSUSED */
    593       1.1        ad int
    594       1.1        ad sys_flock(struct lwp *l, const struct sys_flock_args *uap, register_t *retval)
    595       1.1        ad {
    596       1.1        ad 	/* {
    597       1.1        ad 		syscallarg(int)	fd;
    598       1.1        ad 		syscallarg(int)	how;
    599       1.1        ad 	} */
    600       1.1        ad 	int fd, how, error;
    601       1.1        ad 	file_t *fp;
    602       1.1        ad 	vnode_t	*vp;
    603       1.1        ad 	struct flock lf;
    604       1.1        ad 
    605       1.1        ad 	fd = SCARG(uap, fd);
    606       1.1        ad 	how = SCARG(uap, how);
    607       1.1        ad 	error = 0;
    608       1.1        ad 
    609       1.1        ad 	if ((fp = fd_getfile(fd)) == NULL) {
    610       1.1        ad 		return EBADF;
    611       1.1        ad 	}
    612       1.1        ad 	if (fp->f_type != DTYPE_VNODE) {
    613       1.1        ad 		fd_putfile(fd);
    614       1.1        ad 		return EOPNOTSUPP;
    615       1.1        ad 	}
    616       1.1        ad 
    617  1.27.2.3  jdolecek 	vp = fp->f_vnode;
    618       1.1        ad 	lf.l_whence = SEEK_SET;
    619       1.1        ad 	lf.l_start = 0;
    620       1.1        ad 	lf.l_len = 0;
    621      1.17     njoly 
    622      1.17     njoly 	switch (how & ~LOCK_NB) {
    623      1.17     njoly 	case LOCK_UN:
    624       1.1        ad 		lf.l_type = F_UNLCK;
    625       1.1        ad 		atomic_and_uint(&fp->f_flag, ~FHASLOCK);
    626       1.1        ad 		error = VOP_ADVLOCK(vp, fp, F_UNLCK, &lf, F_FLOCK);
    627       1.1        ad 		fd_putfile(fd);
    628       1.1        ad 		return error;
    629      1.17     njoly 	case LOCK_EX:
    630       1.1        ad 		lf.l_type = F_WRLCK;
    631      1.17     njoly 		break;
    632      1.17     njoly 	case LOCK_SH:
    633       1.1        ad 		lf.l_type = F_RDLCK;
    634      1.17     njoly 		break;
    635      1.17     njoly 	default:
    636       1.1        ad 		fd_putfile(fd);
    637       1.1        ad 		return EINVAL;
    638       1.1        ad 	}
    639      1.17     njoly 
    640       1.1        ad 	atomic_or_uint(&fp->f_flag, FHASLOCK);
    641       1.1        ad 	if (how & LOCK_NB) {
    642       1.1        ad 		error = VOP_ADVLOCK(vp, fp, F_SETLK, &lf, F_FLOCK);
    643       1.1        ad 	} else {
    644       1.1        ad 		error = VOP_ADVLOCK(vp, fp, F_SETLK, &lf, F_FLOCK|F_WAIT);
    645       1.1        ad 	}
    646       1.1        ad 	fd_putfile(fd);
    647       1.1        ad 	return error;
    648       1.1        ad }
    649       1.1        ad 
    650       1.1        ad int
    651       1.1        ad do_posix_fadvise(int fd, off_t offset, off_t len, int advice)
    652       1.1        ad {
    653       1.1        ad 	file_t *fp;
    654      1.15      yamt 	vnode_t *vp;
    655      1.16      yamt 	off_t endoffset;
    656       1.1        ad 	int error;
    657      1.18     rmind 
    658      1.14      yamt 	CTASSERT(POSIX_FADV_NORMAL == UVM_ADV_NORMAL);
    659      1.14      yamt 	CTASSERT(POSIX_FADV_RANDOM == UVM_ADV_RANDOM);
    660      1.14      yamt 	CTASSERT(POSIX_FADV_SEQUENTIAL == UVM_ADV_SEQUENTIAL);
    661       1.1        ad 
    662      1.16      yamt 	if (len == 0) {
    663      1.16      yamt 		endoffset = INT64_MAX;
    664      1.18     rmind 	} else if (len > 0 && (INT64_MAX - offset) >= len) {
    665      1.16      yamt 		endoffset = offset + len;
    666      1.16      yamt 	} else {
    667      1.16      yamt 		return EINVAL;
    668      1.16      yamt 	}
    669       1.1        ad 	if ((fp = fd_getfile(fd)) == NULL) {
    670       1.1        ad 		return EBADF;
    671       1.1        ad 	}
    672       1.1        ad 	if (fp->f_type != DTYPE_VNODE) {
    673       1.1        ad 		if (fp->f_type == DTYPE_PIPE || fp->f_type == DTYPE_SOCKET) {
    674       1.1        ad 			error = ESPIPE;
    675       1.1        ad 		} else {
    676       1.1        ad 			error = EOPNOTSUPP;
    677       1.1        ad 		}
    678       1.1        ad 		fd_putfile(fd);
    679       1.1        ad 		return error;
    680       1.1        ad 	}
    681       1.1        ad 
    682       1.1        ad 	switch (advice) {
    683      1.16      yamt 	case POSIX_FADV_WILLNEED:
    684      1.16      yamt 	case POSIX_FADV_DONTNEED:
    685  1.27.2.3  jdolecek 		vp = fp->f_vnode;
    686      1.16      yamt 		if (vp->v_type != VREG && vp->v_type != VBLK) {
    687      1.16      yamt 			fd_putfile(fd);
    688      1.16      yamt 			return 0;
    689      1.16      yamt 		}
    690      1.16      yamt 		break;
    691      1.16      yamt 	}
    692      1.16      yamt 
    693      1.16      yamt 	switch (advice) {
    694       1.1        ad 	case POSIX_FADV_NORMAL:
    695       1.1        ad 	case POSIX_FADV_RANDOM:
    696       1.1        ad 	case POSIX_FADV_SEQUENTIAL:
    697       1.1        ad 		/*
    698      1.19     rmind 		 * We ignore offset and size.  Must lock the file to
    699       1.1        ad 		 * do this, as f_advice is sub-word sized.
    700       1.1        ad 		 */
    701       1.1        ad 		mutex_enter(&fp->f_lock);
    702       1.1        ad 		fp->f_advice = (u_char)advice;
    703       1.1        ad 		mutex_exit(&fp->f_lock);
    704       1.1        ad 		error = 0;
    705       1.1        ad 		break;
    706       1.1        ad 
    707       1.1        ad 	case POSIX_FADV_WILLNEED:
    708      1.15      yamt 		vp = fp->f_data;
    709  1.27.2.1       tls 		error = uvm_readahead(&vp->v_uobj, offset,
    710  1.27.2.1       tls 				      endoffset - offset,
    711  1.27.2.1       tls 				      vp->v_ractx);
    712      1.15      yamt 		break;
    713      1.15      yamt 
    714       1.1        ad 	case POSIX_FADV_DONTNEED:
    715  1.27.2.3  jdolecek 		vp = fp->f_vnode;
    716      1.19     rmind 		/*
    717      1.19     rmind 		 * Align the region to page boundaries as VOP_PUTPAGES expects
    718      1.19     rmind 		 * by shrinking it.  We shrink instead of expand because we
    719      1.19     rmind 		 * do not want to deactivate cache outside of the requested
    720      1.19     rmind 		 * region.  It means that if the specified region is smaller
    721      1.19     rmind 		 * than PAGE_SIZE, we do nothing.
    722      1.19     rmind 		 */
    723      1.19     rmind 		if (round_page(offset) < trunc_page(endoffset) &&
    724      1.19     rmind 		    offset <= round_page(offset)) {
    725      1.21     rmind 			mutex_enter(vp->v_interlock);
    726      1.19     rmind 			error = VOP_PUTPAGES(vp,
    727      1.19     rmind 			    round_page(offset), trunc_page(endoffset),
    728      1.19     rmind 			    PGO_DEACTIVATE | PGO_CLEANIT);
    729      1.19     rmind 		} else {
    730      1.19     rmind 			error = 0;
    731      1.19     rmind 		}
    732      1.16      yamt 		break;
    733      1.16      yamt 
    734       1.1        ad 	case POSIX_FADV_NOREUSE:
    735       1.1        ad 		/* Not implemented yet. */
    736       1.1        ad 		error = 0;
    737       1.1        ad 		break;
    738       1.1        ad 	default:
    739       1.1        ad 		error = EINVAL;
    740       1.1        ad 		break;
    741       1.1        ad 	}
    742       1.1        ad 
    743       1.1        ad 	fd_putfile(fd);
    744       1.1        ad 	return error;
    745       1.1        ad }
    746       1.1        ad 
int
sys___posix_fadvise50(struct lwp *l,
		      const struct sys___posix_fadvise50_args *uap,
		      register_t *retval)
{
	/* {
		syscallarg(int) fd;
		syscallarg(int) pad;
		syscallarg(off_t) offset;
		syscallarg(off_t) len;
		syscallarg(int) advice;
	} */
	const int fd = SCARG(uap, fd);
	const off_t offset = SCARG(uap, offset);
	const off_t len = SCARG(uap, len);
	const int advice = SCARG(uap, advice);

	/*
	 * The status computed by do_posix_fadvise() is handed back through
	 * *retval; the system call itself always reports success.
	 */
	*retval = do_posix_fadvise(fd, offset, len, advice);

	return 0;
}
    765      1.22  christos 
    766      1.22  christos int
    767      1.22  christos sys_pipe(struct lwp *l, const void *v, register_t *retval)
    768      1.22  christos {
    769      1.22  christos 	return pipe1(l, retval, 0);
    770      1.22  christos }
    771      1.22  christos 
    772      1.22  christos int
    773      1.22  christos sys_pipe2(struct lwp *l, const struct sys_pipe2_args *uap, register_t *retval)
    774      1.22  christos {
    775      1.22  christos 	/* {
    776      1.22  christos 		syscallarg(int[2]) fildes;
    777      1.22  christos 		syscallarg(int) flags;
    778      1.22  christos 	} */
    779      1.22  christos 	int fd[2], error;
    780      1.22  christos 
    781      1.22  christos 	if ((error = pipe1(l, retval, SCARG(uap, flags))) != 0)
    782      1.22  christos 		return error;
    783      1.22  christos 	fd[0] = retval[0];
    784      1.22  christos 	fd[1] = retval[1];
    785      1.23  christos 	if ((error = copyout(fd, SCARG(uap, fildes), sizeof(fd))) != 0)
    786      1.23  christos 		return error;
    787      1.23  christos 	retval[0] = 0;
    788      1.23  christos 	return 0;
    789      1.22  christos }
    790