Home | History | Annotate | Line # | Download | only in dmover
dmover_io.c revision 1.42.2.1
      1  1.42.2.1       tls /*	$NetBSD: dmover_io.c,v 1.42.2.1 2014/08/10 06:54:51 tls Exp $	*/
      2       1.1   thorpej 
      3       1.1   thorpej /*
      4      1.12   thorpej  * Copyright (c) 2002, 2003 Wasabi Systems, Inc.
      5       1.1   thorpej  * All rights reserved.
      6       1.1   thorpej  *
      7       1.1   thorpej  * Written by Jason R. Thorpe for Wasabi Systems, Inc.
      8       1.1   thorpej  *
      9       1.1   thorpej  * Redistribution and use in source and binary forms, with or without
     10       1.1   thorpej  * modification, are permitted provided that the following conditions
     11       1.1   thorpej  * are met:
     12       1.1   thorpej  * 1. Redistributions of source code must retain the above copyright
     13       1.1   thorpej  *    notice, this list of conditions and the following disclaimer.
     14       1.1   thorpej  * 2. Redistributions in binary form must reproduce the above copyright
     15       1.1   thorpej  *    notice, this list of conditions and the following disclaimer in the
     16       1.1   thorpej  *    documentation and/or other materials provided with the distribution.
     17       1.1   thorpej  * 3. All advertising materials mentioning features or use of this software
     18       1.1   thorpej  *    must display the following acknowledgement:
     19       1.1   thorpej  *	This product includes software developed for the NetBSD Project by
     20       1.1   thorpej  *	Wasabi Systems, Inc.
     21       1.1   thorpej  * 4. The name of Wasabi Systems, Inc. may not be used to endorse
     22       1.1   thorpej  *    or promote products derived from this software without specific prior
     23       1.1   thorpej  *    written permission.
     24       1.1   thorpej  *
     25       1.1   thorpej  * THIS SOFTWARE IS PROVIDED BY WASABI SYSTEMS, INC. ``AS IS'' AND
     26       1.1   thorpej  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     27       1.1   thorpej  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     28       1.1   thorpej  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL WASABI SYSTEMS, INC
     29       1.1   thorpej  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     30       1.1   thorpej  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     31       1.1   thorpej  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     32       1.1   thorpej  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     33       1.1   thorpej  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     34       1.1   thorpej  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     35       1.1   thorpej  * POSSIBILITY OF SUCH DAMAGE.
     36       1.1   thorpej  */
     37       1.1   thorpej 
     38       1.1   thorpej /*
     39       1.1   thorpej  * dmover_io.c: Support for user-space access to dmover-api
     40       1.1   thorpej  *
     41       1.1   thorpej  * This interface is quite simple:
     42       1.1   thorpej  *
     43       1.1   thorpej  *	1.  The user opens /dev/dmover, which is a cloning device.  This
     44       1.1   thorpej  *	    allocates internal state for the session.
     45       1.1   thorpej  *
     46       1.1   thorpej  *	2.  The user does a DMIO_SETFUNC to select the data movement
     47       1.1   thorpej  *	    function.  This actually creates the dmover session.
     48       1.1   thorpej  *
     49       1.1   thorpej  *	3.  The user writes request messages to its dmover handle.
     50       1.1   thorpej  *
     51       1.1   thorpej  *	4.  The user reads request responses from its dmover handle.
     52       1.1   thorpej  *
     53       1.1   thorpej  *	5.  The user closes the file descriptor and the session is
     54       1.1   thorpej  *	    torn down.
     55       1.1   thorpej  */
     56       1.1   thorpej 
     57       1.1   thorpej #include <sys/cdefs.h>
     58  1.42.2.1       tls __KERNEL_RCSID(0, "$NetBSD: dmover_io.c,v 1.42.2.1 2014/08/10 06:54:51 tls Exp $");
     59       1.1   thorpej 
     60       1.1   thorpej #include <sys/param.h>
     61       1.1   thorpej #include <sys/queue.h>
     62       1.1   thorpej #include <sys/conf.h>
     63       1.1   thorpej #include <sys/pool.h>
     64       1.1   thorpej #include <sys/proc.h>
     65       1.1   thorpej #include <sys/poll.h>
     66       1.1   thorpej #include <sys/malloc.h>
     67       1.1   thorpej #include <sys/file.h>
     68       1.1   thorpej #include <sys/filedesc.h>
     69       1.1   thorpej #include <sys/filio.h>
     70       1.1   thorpej #include <sys/select.h>
     71       1.1   thorpej #include <sys/systm.h>
     72      1.21      yamt #include <sys/workqueue.h>
     73      1.21      yamt #include <sys/once.h>
     74      1.35    nonaka #include <sys/stat.h>
     75      1.35    nonaka #include <sys/kauth.h>
     76      1.40  jakllsch #include <sys/mutex.h>
     77      1.40  jakllsch #include <sys/condvar.h>
     78      1.21      yamt 
     79      1.39  uebayasi #include <uvm/uvm_extern.h>
     80      1.39  uebayasi 
     81       1.1   thorpej #include <dev/dmover/dmovervar.h>
     82       1.1   thorpej #include <dev/dmover/dmover_io.h>
     83       1.1   thorpej 
     84       1.1   thorpej struct dmio_usrreq_state {
     85      1.21      yamt 	union {
     86      1.21      yamt 		struct work u_work;
     87      1.21      yamt 		TAILQ_ENTRY(dmio_usrreq_state) u_q;
     88      1.21      yamt 	} dus_u;
     89      1.21      yamt #define	dus_q		dus_u.u_q
     90      1.21      yamt #define	dus_work	dus_u.u_work
     91       1.1   thorpej 	struct uio dus_uio_out;
     92       1.1   thorpej 	struct uio *dus_uio_in;
     93       1.1   thorpej 	struct dmover_request *dus_req;
     94       1.1   thorpej 	uint32_t dus_id;
     95      1.21      yamt 	struct vmspace *dus_vmspace;
     96       1.1   thorpej };
     97       1.1   thorpej 
     98       1.1   thorpej struct dmio_state {
     99       1.1   thorpej 	struct dmover_session *ds_session;
    100       1.1   thorpej 	TAILQ_HEAD(, dmio_usrreq_state) ds_pending;
    101       1.1   thorpej 	TAILQ_HEAD(, dmio_usrreq_state) ds_complete;
    102       1.1   thorpej 	struct selinfo ds_selq;
    103      1.19     perry 	volatile int ds_flags;
    104       1.1   thorpej 	u_int ds_nreqs;
    105      1.40  jakllsch 	kmutex_t ds_lock;
    106      1.40  jakllsch 	kcondvar_t ds_complete_cv;
    107      1.40  jakllsch 	kcondvar_t ds_nreqs_cv;
    108      1.33  christos 	struct timespec ds_atime;
    109      1.33  christos 	struct timespec ds_mtime;
    110      1.33  christos 	struct timespec ds_btime;
    111       1.1   thorpej };
    112       1.1   thorpej 
    113      1.21      yamt static ONCE_DECL(dmio_cleaner_control);
    114      1.21      yamt static struct workqueue *dmio_cleaner;
    115      1.21      yamt static int dmio_cleaner_init(void);
    116      1.40  jakllsch static struct dmio_state *dmio_state_get(void);
    117      1.40  jakllsch static void dmio_state_put(struct dmio_state *);
    118      1.21      yamt static void dmio_usrreq_fini1(struct work *wk, void *);
    119      1.21      yamt 
/*
 * Bits kept in dmio_state::ds_flags.
 */
/* A select/poll notification is wanted (presumably set by the poll op). */
#define	DMIO_STATE_SEL		0x0001
/* Handle is being torn down; completions free instead of queueing. */
#define	DMIO_STATE_DEAD		0x0002
/* DMIO_SETFUNC is in the middle of creating the session. */
#define	DMIO_STATE_LARVAL	0x0004
/* A reader is asleep waiting for a completed request. */
#define	DMIO_STATE_READ_WAIT	0x0008
/* A writer is asleep waiting for a free request slot. */
#define	DMIO_STATE_WRITE_WAIT	0x0010

/* Upper bound on requests outstanding per handle. */
#define	DMIO_NREQS_MAX		64	/* XXX pulled out of a hat */
    127       1.1   thorpej 
    128       1.1   thorpej struct pool dmio_state_pool;
    129       1.1   thorpej struct pool dmio_usrreq_state_pool;
    130       1.1   thorpej 
    131       1.1   thorpej void	dmoverioattach(int);
    132       1.5   gehenna 
    133       1.5   gehenna dev_type_open(dmoverioopen);
    134       1.5   gehenna 
    135       1.5   gehenna const struct cdevsw dmoverio_cdevsw = {
    136      1.42  dholland 	.d_open = dmoverioopen,
    137      1.42  dholland 	.d_close = noclose,
    138      1.42  dholland 	.d_read = noread,
    139      1.42  dholland 	.d_write = nowrite,
    140      1.42  dholland 	.d_ioctl = noioctl,
    141      1.42  dholland 	.d_stop = nostop,
    142      1.42  dholland 	.d_tty = notty,
    143      1.42  dholland 	.d_poll = nopoll,
    144      1.42  dholland 	.d_mmap = nommap,
    145      1.42  dholland 	.d_kqfilter = nokqfilter,
    146  1.42.2.1       tls 	.d_discard = nodiscard,
    147      1.42  dholland 	.d_flag = D_OTHER
    148       1.5   gehenna };
    149       1.1   thorpej 
    150       1.1   thorpej /*
    151       1.1   thorpej  * dmoverioattach:
    152       1.1   thorpej  *
    153       1.1   thorpej  *	Pseudo-device attach routine.
    154       1.1   thorpej  */
    155       1.1   thorpej void
    156       1.1   thorpej dmoverioattach(int count)
    157       1.1   thorpej {
    158       1.1   thorpej 
    159       1.1   thorpej 	pool_init(&dmio_state_pool, sizeof(struct dmio_state),
    160      1.26        ad 	    0, 0, 0, "dmiostate", NULL, IPL_SOFTCLOCK);
    161       1.1   thorpej 	pool_init(&dmio_usrreq_state_pool, sizeof(struct dmio_usrreq_state),
    162      1.26        ad 	    0, 0, 0, "dmiourstate", NULL, IPL_SOFTCLOCK);
    163       1.1   thorpej }
    164       1.1   thorpej 
    165       1.1   thorpej /*
    166      1.21      yamt  * dmio_cleaner_init:
    167      1.21      yamt  *
    168      1.21      yamt  *	Create cleaner thread.
    169      1.21      yamt  */
    170      1.21      yamt static int
    171      1.21      yamt dmio_cleaner_init(void)
    172      1.21      yamt {
    173      1.21      yamt 
    174      1.21      yamt 	return workqueue_create(&dmio_cleaner, "dmioclean", dmio_usrreq_fini1,
    175      1.24      yamt 	    NULL, PWAIT, IPL_SOFTCLOCK, 0);
    176      1.21      yamt }
    177      1.21      yamt 
    178      1.40  jakllsch static struct dmio_state *
    179      1.40  jakllsch dmio_state_get(void)
    180      1.40  jakllsch {
    181      1.40  jakllsch 	struct dmio_state *ds;
    182      1.40  jakllsch 
    183      1.40  jakllsch 	ds = pool_get(&dmio_state_pool, PR_WAITOK);
    184      1.40  jakllsch 
    185      1.40  jakllsch 	memset(ds, 0, sizeof(*ds));
    186      1.40  jakllsch 
    187      1.40  jakllsch 	getnanotime(&ds->ds_btime);
    188      1.40  jakllsch 	ds->ds_atime = ds->ds_mtime = ds->ds_btime;
    189      1.40  jakllsch 
    190      1.40  jakllsch 	mutex_init(&ds->ds_lock, MUTEX_DEFAULT, IPL_SOFTCLOCK);
    191      1.40  jakllsch 	cv_init(&ds->ds_complete_cv, "dmvrrd");
    192      1.40  jakllsch 	cv_init(&ds->ds_nreqs_cv, "dmiowr");
    193      1.40  jakllsch 	TAILQ_INIT(&ds->ds_pending);
    194      1.40  jakllsch 	TAILQ_INIT(&ds->ds_complete);
    195      1.40  jakllsch 	selinit(&ds->ds_selq);
    196      1.40  jakllsch 
    197      1.40  jakllsch 	return ds;
    198      1.40  jakllsch }
    199      1.40  jakllsch 
    200      1.40  jakllsch static void
    201      1.40  jakllsch dmio_state_put(struct dmio_state *ds)
    202      1.40  jakllsch {
    203      1.40  jakllsch 
    204      1.40  jakllsch 	seldestroy(&ds->ds_selq);
    205      1.40  jakllsch 	cv_destroy(&ds->ds_nreqs_cv);
    206      1.40  jakllsch 	cv_destroy(&ds->ds_complete_cv);
    207      1.40  jakllsch 	mutex_destroy(&ds->ds_lock);
    208      1.40  jakllsch 
    209      1.40  jakllsch 	pool_put(&dmio_state_pool, ds);
    210      1.40  jakllsch }
    211      1.40  jakllsch 
    212      1.21      yamt /*
    213       1.1   thorpej  * dmio_usrreq_init:
    214       1.1   thorpej  *
    215       1.1   thorpej  *	Build a request structure.
    216       1.1   thorpej  */
    217       1.1   thorpej static int
    218       1.1   thorpej dmio_usrreq_init(struct file *fp, struct dmio_usrreq_state *dus,
    219       1.1   thorpej     struct dmio_usrreq *req, struct dmover_request *dreq)
    220       1.1   thorpej {
    221       1.1   thorpej 	struct dmio_state *ds = (struct dmio_state *) fp->f_data;
    222       1.1   thorpej 	struct dmover_session *dses = ds->ds_session;
    223       1.1   thorpej 	struct uio *uio_out = &dus->dus_uio_out;
    224       1.1   thorpej 	struct uio *uio_in;
    225       1.1   thorpej 	dmio_buffer inbuf;
    226       1.1   thorpej 	size_t len;
    227       1.7   thorpej 	int i, error;
    228       1.7   thorpej 	u_int j;
    229       1.1   thorpej 
    230       1.1   thorpej 	/* XXX How should malloc interact w/ FNONBLOCK? */
    231       1.1   thorpej 
    232      1.21      yamt 	error = RUN_ONCE(&dmio_cleaner_control, dmio_cleaner_init);
    233      1.21      yamt 	if (error) {
    234      1.21      yamt 		return error;
    235      1.21      yamt 	}
    236      1.21      yamt 
    237      1.21      yamt 	error = proc_vmspace_getref(curproc, &dus->dus_vmspace);
    238      1.21      yamt 	if (error) {
    239      1.21      yamt 		return error;
    240      1.21      yamt 	}
    241      1.21      yamt 
    242      1.12   thorpej 	if (req->req_outbuf.dmbuf_iovcnt != 0) {
    243      1.12   thorpej 		if (req->req_outbuf.dmbuf_iovcnt > IOV_MAX)
    244      1.12   thorpej 			return (EINVAL);
    245      1.12   thorpej 		len = sizeof(struct iovec) * req->req_outbuf.dmbuf_iovcnt;
    246      1.12   thorpej 		uio_out->uio_iov = malloc(len, M_TEMP, M_WAITOK);
    247      1.12   thorpej 		error = copyin(req->req_outbuf.dmbuf_iov, uio_out->uio_iov,
    248      1.12   thorpej 		    len);
    249      1.12   thorpej 		if (error) {
    250      1.12   thorpej 			free(uio_out->uio_iov, M_TEMP);
    251      1.12   thorpej 			return (error);
    252      1.12   thorpej 		}
    253       1.1   thorpej 
    254      1.12   thorpej 		for (j = 0, len = 0; j < req->req_outbuf.dmbuf_iovcnt; j++) {
    255      1.12   thorpej 			len += uio_out->uio_iov[j].iov_len;
    256      1.12   thorpej 			if (len > SSIZE_MAX) {
    257      1.12   thorpej 				free(uio_out->uio_iov, M_TEMP);
    258      1.12   thorpej 				return (EINVAL);
    259      1.12   thorpej 			}
    260      1.12   thorpej 		}
    261       1.1   thorpej 
    262      1.12   thorpej 		uio_out->uio_iovcnt = req->req_outbuf.dmbuf_iovcnt;
    263      1.12   thorpej 		uio_out->uio_resid = len;
    264      1.12   thorpej 		uio_out->uio_rw = UIO_READ;
    265      1.21      yamt 		uio_out->uio_vmspace = dus->dus_vmspace;
    266      1.21      yamt 
    267      1.12   thorpej 		dreq->dreq_outbuf_type = DMOVER_BUF_UIO;
    268      1.12   thorpej 		dreq->dreq_outbuf.dmbuf_uio = uio_out;
    269      1.12   thorpej 	} else {
    270      1.12   thorpej 		uio_out->uio_iov = NULL;
    271      1.12   thorpej 		uio_out = NULL;
    272      1.12   thorpej 		dreq->dreq_outbuf_type = DMOVER_BUF_NONE;
    273       1.1   thorpej 	}
    274       1.1   thorpej 
    275      1.12   thorpej 	memcpy(dreq->dreq_immediate, req->req_immediate,
    276      1.12   thorpej 	    sizeof(dreq->dreq_immediate));
    277       1.1   thorpej 
    278       1.1   thorpej 	if (dses->dses_ninputs == 0) {
    279      1.12   thorpej 		/* No inputs; all done. */
    280       1.1   thorpej 		return (0);
    281       1.1   thorpej 	}
    282       1.1   thorpej 
    283       1.1   thorpej 	dreq->dreq_inbuf_type = DMOVER_BUF_UIO;
    284       1.1   thorpej 
    285       1.1   thorpej 	dus->dus_uio_in = malloc(sizeof(struct uio) * dses->dses_ninputs,
    286       1.1   thorpej 	    M_TEMP, M_WAITOK);
    287       1.1   thorpej 	memset(dus->dus_uio_in, 0, sizeof(struct uio) * dses->dses_ninputs);
    288       1.1   thorpej 
    289       1.1   thorpej 	for (i = 0; i < dses->dses_ninputs; i++) {
    290       1.1   thorpej 		uio_in = &dus->dus_uio_in[i];
    291       1.1   thorpej 
    292       1.1   thorpej 		error = copyin(&req->req_inbuf[i], &inbuf, sizeof(inbuf));
    293       1.1   thorpej 		if (error)
    294       1.1   thorpej 			goto bad;
    295       1.1   thorpej 
    296       1.1   thorpej 		if (inbuf.dmbuf_iovcnt > IOV_MAX) {
    297       1.1   thorpej 			error = EINVAL;
    298       1.1   thorpej 			goto bad;
    299       1.1   thorpej 		}
    300       1.1   thorpej 		len = sizeof(struct iovec) * inbuf.dmbuf_iovcnt;
    301       1.1   thorpej 		if (len == 0) {
    302       1.1   thorpej 			error = EINVAL;
    303       1.1   thorpej 			goto bad;
    304       1.1   thorpej 		}
    305       1.1   thorpej 		uio_in->uio_iov = malloc(len, M_TEMP, M_WAITOK);
    306       1.1   thorpej 
    307       1.1   thorpej 		error = copyin(inbuf.dmbuf_iov, uio_in->uio_iov, len);
    308       1.1   thorpej 		if (error) {
    309       1.1   thorpej 			free(uio_in->uio_iov, M_TEMP);
    310       1.1   thorpej 			goto bad;
    311       1.1   thorpej 		}
    312       1.1   thorpej 
    313      1.12   thorpej 		for (j = 0, len = 0; j < inbuf.dmbuf_iovcnt; j++) {
    314       1.1   thorpej 			len += uio_in->uio_iov[j].iov_len;
    315       1.1   thorpej 			if (len > SSIZE_MAX) {
    316       1.1   thorpej 				free(uio_in->uio_iov, M_TEMP);
    317       1.1   thorpej 				error = EINVAL;
    318       1.1   thorpej 				goto bad;
    319       1.1   thorpej 			}
    320       1.1   thorpej 		}
    321       1.1   thorpej 
    322      1.12   thorpej 		if (uio_out != NULL && len != uio_out->uio_resid) {
    323       1.1   thorpej 			free(uio_in->uio_iov, M_TEMP);
    324       1.1   thorpej 			error = EINVAL;
    325       1.1   thorpej 			goto bad;
    326       1.1   thorpej 		}
    327       1.1   thorpej 
    328       1.1   thorpej 		uio_in->uio_iovcnt = inbuf.dmbuf_iovcnt;
    329       1.1   thorpej 		uio_in->uio_resid = len;
    330       1.1   thorpej 		uio_in->uio_rw = UIO_WRITE;
    331      1.21      yamt 		uio_in->uio_vmspace = dus->dus_vmspace;
    332       1.1   thorpej 
    333       1.1   thorpej 		dreq->dreq_inbuf[i].dmbuf_uio = uio_in;
    334       1.1   thorpej 	}
    335       1.1   thorpej 
    336       1.1   thorpej 	return (0);
    337       1.1   thorpej 
    338       1.1   thorpej  bad:
    339       1.1   thorpej 	if (i > 0) {
    340       1.1   thorpej 		for (--i; i >= 0; i--) {
    341       1.1   thorpej 			uio_in = &dus->dus_uio_in[i];
    342       1.1   thorpej 			free(uio_in->uio_iov, M_TEMP);
    343       1.1   thorpej 		}
    344       1.1   thorpej 	}
    345       1.1   thorpej 	free(dus->dus_uio_in, M_TEMP);
    346      1.12   thorpej 	if (uio_out != NULL)
    347      1.12   thorpej 		free(uio_out->uio_iov, M_TEMP);
    348      1.21      yamt 	uvmspace_free(dus->dus_vmspace);
    349       1.1   thorpej 	return (error);
    350       1.1   thorpej }
    351       1.1   thorpej 
    352       1.1   thorpej /*
    353       1.1   thorpej  * dmio_usrreq_fini:
    354       1.1   thorpej  *
    355       1.1   thorpej  *	Tear down a request.  Must be called at splsoftclock().
    356       1.1   thorpej  */
    357       1.1   thorpej static void
    358       1.1   thorpej dmio_usrreq_fini(struct dmio_state *ds, struct dmio_usrreq_state *dus)
    359       1.1   thorpej {
    360       1.1   thorpej 	struct dmover_session *dses = ds->ds_session;
    361       1.1   thorpej 	struct uio *uio_out = &dus->dus_uio_out;
    362       1.1   thorpej 	struct uio *uio_in;
    363       1.1   thorpej 	int i;
    364       1.1   thorpej 
    365      1.12   thorpej 	if (uio_out->uio_iov != NULL)
    366      1.12   thorpej 		free(uio_out->uio_iov, M_TEMP);
    367       1.1   thorpej 
    368      1.21      yamt 	if (dses->dses_ninputs) {
    369      1.21      yamt 		for (i = 0; i < dses->dses_ninputs; i++) {
    370      1.21      yamt 			uio_in = &dus->dus_uio_in[i];
    371      1.21      yamt 			free(uio_in->uio_iov, M_TEMP);
    372      1.21      yamt 		}
    373      1.21      yamt 		free(dus->dus_uio_in, M_TEMP);
    374       1.1   thorpej 	}
    375       1.1   thorpej 
    376      1.27     rmind 	workqueue_enqueue(dmio_cleaner, &dus->dus_work, NULL);
    377      1.21      yamt }
    378      1.21      yamt 
    379      1.21      yamt static void
    380      1.21      yamt dmio_usrreq_fini1(struct work *wk, void *dummy)
    381      1.21      yamt {
    382      1.21      yamt 	struct dmio_usrreq_state *dus = (void *)wk;
    383       1.1   thorpej 
    384      1.21      yamt 	KASSERT(wk == &dus->dus_work);
    385       1.1   thorpej 
    386      1.21      yamt 	uvmspace_free(dus->dus_vmspace);
    387       1.1   thorpej 	pool_put(&dmio_usrreq_state_pool, dus);
    388       1.1   thorpej }
    389       1.1   thorpej 
    390       1.1   thorpej /*
    391       1.1   thorpej  * dmio_read:
    392       1.1   thorpej  *
    393       1.1   thorpej  *	Read file op.
    394       1.1   thorpej  */
    395       1.1   thorpej static int
    396       1.1   thorpej dmio_read(struct file *fp, off_t *offp, struct uio *uio,
    397      1.22      elad     kauth_cred_t cred, int flags)
    398       1.1   thorpej {
    399       1.1   thorpej 	struct dmio_state *ds = (struct dmio_state *) fp->f_data;
    400       1.1   thorpej 	struct dmio_usrreq_state *dus;
    401       1.1   thorpej 	struct dmover_request *dreq;
    402       1.1   thorpej 	struct dmio_usrresp resp;
    403      1.40  jakllsch 	int error = 0, progress = 0;
    404       1.1   thorpej 
    405       1.1   thorpej 	if ((uio->uio_resid % sizeof(resp)) != 0)
    406       1.1   thorpej 		return (EINVAL);
    407       1.1   thorpej 
    408       1.1   thorpej 	if (ds->ds_session == NULL)
    409       1.1   thorpej 		return (ENXIO);
    410       1.1   thorpej 
    411      1.33  christos 	getnanotime(&ds->ds_atime);
    412      1.40  jakllsch 	mutex_enter(&ds->ds_lock);
    413       1.1   thorpej 
    414       1.1   thorpej 	while (uio->uio_resid != 0) {
    415       1.1   thorpej 
    416       1.1   thorpej 		for (;;) {
    417       1.1   thorpej 			dus = TAILQ_FIRST(&ds->ds_complete);
    418       1.1   thorpej 			if (dus == NULL) {
    419       1.1   thorpej 				if (fp->f_flag & FNONBLOCK) {
    420       1.1   thorpej 					error = progress ? 0 : EWOULDBLOCK;
    421       1.1   thorpej 					goto out;
    422       1.1   thorpej 				}
    423       1.9       scw 				ds->ds_flags |= DMIO_STATE_READ_WAIT;
    424      1.40  jakllsch 				error = cv_wait_sig(&ds->ds_complete_cv, &ds->ds_lock);
    425       1.1   thorpej 				if (error)
    426       1.1   thorpej 					goto out;
    427       1.1   thorpej 				continue;
    428       1.1   thorpej 			}
    429       1.1   thorpej 			/* Have a completed request. */
    430       1.1   thorpej 			TAILQ_REMOVE(&ds->ds_complete, dus, dus_q);
    431       1.1   thorpej 			ds->ds_nreqs--;
    432       1.1   thorpej 			if (ds->ds_flags & DMIO_STATE_WRITE_WAIT) {
    433       1.1   thorpej 				ds->ds_flags &= ~DMIO_STATE_WRITE_WAIT;
    434      1.40  jakllsch 				cv_broadcast(&ds->ds_nreqs_cv);
    435       1.1   thorpej 			}
    436       1.1   thorpej 			if (ds->ds_flags & DMIO_STATE_SEL) {
    437       1.1   thorpej 				ds->ds_flags &= ~DMIO_STATE_SEL;
    438      1.30     rmind 				selnotify(&ds->ds_selq, POLLIN | POLLRDNORM, 0);
    439       1.1   thorpej 			}
    440       1.1   thorpej 			break;
    441       1.1   thorpej 		}
    442       1.1   thorpej 
    443       1.1   thorpej 		dreq = dus->dus_req;
    444       1.1   thorpej 		resp.resp_id = dus->dus_id;
    445      1.12   thorpej 		if (dreq->dreq_flags & DMOVER_REQ_ERROR)
    446      1.12   thorpej 			resp.resp_error = dreq->dreq_error;
    447      1.12   thorpej 		else {
    448      1.12   thorpej 			resp.resp_error = 0;
    449      1.12   thorpej 			memcpy(resp.resp_immediate, dreq->dreq_immediate,
    450      1.12   thorpej 			    sizeof(resp.resp_immediate));
    451      1.12   thorpej 		}
    452       1.1   thorpej 
    453       1.1   thorpej 		dmio_usrreq_fini(ds, dus);
    454       1.1   thorpej 
    455      1.40  jakllsch 		mutex_exit(&ds->ds_lock);
    456       1.1   thorpej 
    457       1.1   thorpej 		progress = 1;
    458       1.1   thorpej 
    459       1.1   thorpej 		dmover_request_free(dreq);
    460       1.1   thorpej 
    461       1.1   thorpej 		error = uiomove(&resp, sizeof(resp), uio);
    462       1.1   thorpej 		if (error)
    463       1.1   thorpej 			return (error);
    464       1.1   thorpej 
    465      1.40  jakllsch 		mutex_enter(&ds->ds_lock);
    466       1.1   thorpej 	}
    467       1.1   thorpej 
    468       1.1   thorpej  out:
    469      1.40  jakllsch 	mutex_exit(&ds->ds_lock);
    470       1.1   thorpej 
    471       1.1   thorpej 	return (error);
    472       1.1   thorpej }
    473       1.1   thorpej 
    474       1.1   thorpej /*
    475       1.1   thorpej  * dmio_usrreq_done:
    476       1.1   thorpej  *
    477       1.1   thorpej  *	Dmover completion callback.
    478       1.1   thorpej  */
    479       1.1   thorpej static void
    480       1.1   thorpej dmio_usrreq_done(struct dmover_request *dreq)
    481       1.1   thorpej {
    482       1.1   thorpej 	struct dmio_usrreq_state *dus = dreq->dreq_cookie;
    483       1.1   thorpej 	struct dmio_state *ds = dreq->dreq_session->dses_cookie;
    484       1.1   thorpej 
    485       1.1   thorpej 	/* We're already at splsoftclock(). */
    486       1.1   thorpej 
    487      1.40  jakllsch 	mutex_enter(&ds->ds_lock);
    488       1.1   thorpej 	TAILQ_REMOVE(&ds->ds_pending, dus, dus_q);
    489       1.1   thorpej 	if (ds->ds_flags & DMIO_STATE_DEAD) {
    490      1.40  jakllsch 		int nreqs = --ds->ds_nreqs;
    491      1.40  jakllsch 		mutex_exit(&ds->ds_lock);
    492       1.1   thorpej 		dmio_usrreq_fini(ds, dus);
    493       1.1   thorpej 		dmover_request_free(dreq);
    494      1.40  jakllsch 		if (nreqs == 0) {
    495      1.40  jakllsch 			dmio_state_put(ds);
    496       1.1   thorpej 		}
    497      1.40  jakllsch 		return;
    498      1.40  jakllsch 	}
    499      1.40  jakllsch 
    500      1.40  jakllsch 	TAILQ_INSERT_TAIL(&ds->ds_complete, dus, dus_q);
    501      1.40  jakllsch 	if (ds->ds_flags & DMIO_STATE_READ_WAIT) {
    502      1.40  jakllsch 		ds->ds_flags &= ~DMIO_STATE_READ_WAIT;
    503      1.40  jakllsch 		cv_broadcast(&ds->ds_complete_cv);
    504      1.40  jakllsch 	}
    505      1.40  jakllsch 	if (ds->ds_flags & DMIO_STATE_SEL) {
    506      1.40  jakllsch 		ds->ds_flags &= ~DMIO_STATE_SEL;
    507      1.40  jakllsch 		selnotify(&ds->ds_selq, POLLOUT | POLLWRNORM, 0);
    508       1.1   thorpej 	}
    509      1.40  jakllsch 	mutex_exit(&ds->ds_lock);
    510       1.1   thorpej }
    511       1.1   thorpej 
    512       1.1   thorpej /*
    513       1.1   thorpej  * dmio_write:
    514       1.1   thorpej  *
    515       1.1   thorpej  *	Write file op.
    516       1.1   thorpej  */
    517       1.1   thorpej static int
    518       1.1   thorpej dmio_write(struct file *fp, off_t *offp, struct uio *uio,
    519      1.22      elad     kauth_cred_t cred, int flags)
    520       1.1   thorpej {
    521       1.1   thorpej 	struct dmio_state *ds = (struct dmio_state *) fp->f_data;
    522       1.1   thorpej 	struct dmio_usrreq_state *dus;
    523       1.1   thorpej 	struct dmover_request *dreq;
    524       1.1   thorpej 	struct dmio_usrreq req;
    525      1.40  jakllsch 	int error = 0, progress = 0;
    526       1.1   thorpej 
    527       1.1   thorpej 	if ((uio->uio_resid % sizeof(req)) != 0)
    528       1.1   thorpej 		return (EINVAL);
    529       1.1   thorpej 
    530       1.1   thorpej 	if (ds->ds_session == NULL)
    531       1.1   thorpej 		return (ENXIO);
    532       1.1   thorpej 
    533      1.33  christos 	getnanotime(&ds->ds_mtime);
    534      1.40  jakllsch 	mutex_enter(&ds->ds_lock);
    535       1.1   thorpej 
    536       1.1   thorpej 	while (uio->uio_resid != 0) {
    537       1.1   thorpej 
    538       1.1   thorpej 		if (ds->ds_nreqs == DMIO_NREQS_MAX) {
    539       1.1   thorpej 			if (fp->f_flag & FNONBLOCK) {
    540       1.1   thorpej 				error = progress ? 0 : EWOULDBLOCK;
    541       1.1   thorpej 				break;
    542       1.1   thorpej 			}
    543       1.1   thorpej 			ds->ds_flags |= DMIO_STATE_WRITE_WAIT;
    544      1.40  jakllsch 			error = cv_wait_sig(&ds->ds_complete_cv, &ds->ds_lock);
    545       1.1   thorpej 			if (error)
    546       1.1   thorpej 				break;
    547       1.1   thorpej 			continue;
    548       1.1   thorpej 		}
    549       1.1   thorpej 
    550       1.1   thorpej 		ds->ds_nreqs++;
    551       1.1   thorpej 
    552      1.40  jakllsch 		mutex_exit(&ds->ds_lock);
    553       1.1   thorpej 
    554       1.1   thorpej 		progress = 1;
    555       1.1   thorpej 
    556       1.1   thorpej 		error = uiomove(&req, sizeof(req), uio);
    557       1.1   thorpej 		if (error) {
    558      1.40  jakllsch 			mutex_enter(&ds->ds_lock);
    559       1.1   thorpej 			ds->ds_nreqs--;
    560       1.1   thorpej 			break;
    561       1.1   thorpej 		}
    562       1.1   thorpej 
    563       1.1   thorpej 		/* XXX How should this interact with FNONBLOCK? */
    564       1.1   thorpej 		dreq = dmover_request_alloc(ds->ds_session, NULL);
    565       1.1   thorpej 		if (dreq == NULL) {
    566       1.1   thorpej 			/* XXX */
    567       1.1   thorpej 			ds->ds_nreqs--;
    568       1.1   thorpej 			error = ENOMEM;
    569      1.40  jakllsch 			return error;
    570       1.1   thorpej 		}
    571       1.1   thorpej 		dus = pool_get(&dmio_usrreq_state_pool, PR_WAITOK);
    572       1.1   thorpej 
    573       1.1   thorpej 		error = dmio_usrreq_init(fp, dus, &req, dreq);
    574       1.1   thorpej 		if (error) {
    575       1.1   thorpej 			dmover_request_free(dreq);
    576       1.1   thorpej 			pool_put(&dmio_usrreq_state_pool, dus);
    577      1.40  jakllsch 			return error;
    578       1.1   thorpej 		}
    579       1.1   thorpej 
    580       1.1   thorpej 		dreq->dreq_callback = dmio_usrreq_done;
    581       1.1   thorpej 		dreq->dreq_cookie = dus;
    582       1.1   thorpej 
    583       1.1   thorpej 		dus->dus_req = dreq;
    584       1.1   thorpej 		dus->dus_id = req.req_id;
    585       1.1   thorpej 
    586      1.40  jakllsch 		mutex_enter(&ds->ds_lock);
    587       1.1   thorpej 
    588       1.1   thorpej 		TAILQ_INSERT_TAIL(&ds->ds_pending, dus, dus_q);
    589       1.1   thorpej 
    590      1.40  jakllsch 		mutex_exit(&ds->ds_lock);
    591       1.1   thorpej 
    592       1.1   thorpej 		dmover_process(dreq);
    593       1.1   thorpej 
    594      1.40  jakllsch 		mutex_enter(&ds->ds_lock);
    595       1.1   thorpej 	}
    596       1.1   thorpej 
    597      1.40  jakllsch 	mutex_exit(&ds->ds_lock);
    598       1.1   thorpej 
    599       1.1   thorpej 	return (error);
    600       1.1   thorpej }
    601       1.1   thorpej 
                            /*
                             * dmio_stat:
                             *
                             *	Stat file op.  Zeroes *st, then fills in st_dev (the major
                             *	number looked up for dmoverio_cdevsw, minor 0), the access
                             *	and modify times from the dmio_state, the change and birth
                             *	times from ds_btime, and the uid/gid from the effective IDs
                             *	of the credentials attached to the file.  Always returns 0.
                             */
    602      1.33  christos static int
    603      1.33  christos dmio_stat(struct file *fp, struct stat *st)
    604      1.33  christos {
    605      1.33  christos 	struct dmio_state *ds = fp->f_data;
    606      1.33  christos 
                            	/* Start from an all-zero stat so fields not set below read as 0. */
    607      1.41   msaitoh 	(void)memset(st, 0, sizeof(*st));
                            	/*
                            	 * The field copies below run with the kernel lock held.
                            	 * NOTE(review): presumably this guards the ds_*time fields
                            	 * and the cdevsw lookup -- confirm.
                            	 */
    608      1.33  christos 	KERNEL_LOCK(1, NULL);
    609      1.33  christos 	st->st_dev = makedev(cdevsw_lookup_major(&dmoverio_cdevsw), 0);
    610      1.35    nonaka 	st->st_atimespec = ds->ds_atime;
    611      1.35    nonaka 	st->st_mtimespec = ds->ds_mtime;
                            	/* Change time and birth time are both reported as ds_btime. */
    612      1.35    nonaka 	st->st_ctimespec = st->st_birthtimespec = ds->ds_btime;
    613      1.34  christos 	st->st_uid = kauth_cred_geteuid(fp->f_cred);
    614      1.34  christos 	st->st_gid = kauth_cred_getegid(fp->f_cred);
    615      1.35    nonaka 	KERNEL_UNLOCK_ONE(NULL);
    616      1.33  christos 	return 0;
    617      1.33  christos }
    618      1.33  christos 
    619       1.1   thorpej /*
    620       1.1   thorpej  * dmio_ioctl:
    621       1.1   thorpej  *
    622       1.1   thorpej  *	Ioctl file op.
                             *
                             *	FIONBIO and FIOASYNC are accepted and ignored (return 0).
                             *	DMIO_SETFUNC creates a dmover session for the function named
                             *	in the struct dmio_setfunc argument and attaches it to this
                             *	dmio_state.  It returns EBUSY if a session is already attached
                             *	or another DMIO_SETFUNC is in progress, otherwise the result
                             *	of dmover_session_create().  Any other command returns ENOTTY.
    623       1.1   thorpej  */
    624       1.1   thorpej static int
    625      1.31        ad dmio_ioctl(struct file *fp, u_long cmd, void *data)
    626       1.1   thorpej {
    627       1.1   thorpej 	struct dmio_state *ds = (struct dmio_state *) fp->f_data;
    628      1.40  jakllsch 	int error;
    629       1.1   thorpej 
    630       1.1   thorpej 	switch (cmd) {
    631       1.1   thorpej 	case FIONBIO:
    632       1.1   thorpej 	case FIOASYNC:
                            		/* Nothing to do for these; report success. */
    633       1.1   thorpej 		return (0);
    634       1.1   thorpej 
    635       1.1   thorpej 	case DMIO_SETFUNC:
    636       1.1   thorpej 	    {
    637       1.8       dsl 		struct dmio_setfunc *dsf = data;
    638       1.1   thorpej 		struct dmover_session *dses;
    639       1.1   thorpej 
    640      1.40  jakllsch 		mutex_enter(&ds->ds_lock);
    641       1.1   thorpej 
                            		/*
                            		 * Refuse if a session is already attached or another
                            		 * DMIO_SETFUNC has marked the state larval.
                            		 */
    642       1.1   thorpej 		if (ds->ds_session != NULL ||
    643       1.1   thorpej 		    (ds->ds_flags & DMIO_STATE_LARVAL) != 0) {
    644      1.40  jakllsch 			mutex_exit(&ds->ds_lock);
    645       1.1   thorpej 			return (EBUSY);
    646       1.1   thorpej 		}
    647       1.1   thorpej 
                            		/*
                            		 * Mark setup as in progress so that a concurrent
                            		 * DMIO_SETFUNC fails with EBUSY while the lock is
                            		 * dropped for the session creation below.
                            		 * NOTE(review): the lock is presumably dropped because
                            		 * dmover_session_create() may sleep -- confirm.
                            		 */
    648       1.1   thorpej 		ds->ds_flags |= DMIO_STATE_LARVAL;
    649       1.1   thorpej 
    650      1.40  jakllsch 		mutex_exit(&ds->ds_lock);
    651       1.1   thorpej 
                            		/* Force NUL termination of the name before using it as a string. */
    652       1.1   thorpej 		dsf->dsf_name[DMIO_MAX_FUNCNAME - 1] = '\0';
    653       1.1   thorpej 		error = dmover_session_create(dsf->dsf_name, &dses);
    654       1.1   thorpej 
    655      1.40  jakllsch 		mutex_enter(&ds->ds_lock);
    656       1.1   thorpej 
                            		/* On success, link the session and the state to each other. */
    657       1.1   thorpej 		if (error == 0) {
    658       1.1   thorpej 			dses->dses_cookie = ds;
    659       1.1   thorpej 			ds->ds_session = dses;
    660       1.1   thorpej 		}
                            		/* Setup is finished either way; clear the in-progress mark. */
    661       1.1   thorpej 		ds->ds_flags &= ~DMIO_STATE_LARVAL;
    662       1.1   thorpej 
    663      1.40  jakllsch 		mutex_exit(&ds->ds_lock);
    664       1.1   thorpej 		break;
    665       1.1   thorpej 	    }
    666       1.1   thorpej 
    667       1.1   thorpej 	default:
    668       1.1   thorpej 		error = ENOTTY;
    669       1.1   thorpej 	}
    670       1.1   thorpej 
    671       1.1   thorpej 	return (error);
    672       1.1   thorpej }
    673       1.1   thorpej 
    674       1.1   thorpej /*
    675       1.1   thorpej  * dmio_poll:
    676       1.1   thorpej  *
    677       1.1   thorpej  *	Poll file op.
                             *
                             *	Returns the subset of the requested POLLIN/POLLRDNORM and
                             *	POLLOUT/POLLWRNORM events that are ready.  Reading is ready
                             *	when ds_complete is non-empty; writing is ready when ds_nreqs
                             *	is below DMIO_NREQS_MAX.  If the state is marked dead, every
                             *	requested read/write event is reported.  If nothing is ready,
                             *	the caller is recorded on ds_selq and 0 is returned.
    678       1.1   thorpej  */
    679       1.1   thorpej static int
    680      1.31        ad dmio_poll(struct file *fp, int events)
    681       1.1   thorpej {
    682       1.1   thorpej 	struct dmio_state *ds = (struct dmio_state *) fp->f_data;
    683      1.40  jakllsch 	int revents = 0;
    684       1.1   thorpej 
                            	/* No read or write events requested: nothing to check. */
    685       1.1   thorpej 	if ((events & (POLLIN | POLLRDNORM | POLLOUT | POLLWRNORM)) == 0)
    686       1.1   thorpej 		return (revents);
    687       1.1   thorpej 
    688      1.40  jakllsch 	mutex_enter(&ds->ds_lock);
    689       1.1   thorpej 
    690       1.1   thorpej 	if (ds->ds_flags & DMIO_STATE_DEAD) {
    691       1.1   thorpej 		/* EOF: report every requested read/write event as ready. */
    692       1.1   thorpej 		revents |= events & (POLLIN | POLLRDNORM |
    693       1.1   thorpej 		    POLLOUT | POLLWRNORM);
    694       1.1   thorpej 		goto out;
    695       1.1   thorpej 	}
    696       1.1   thorpej 
    697       1.1   thorpej 	/* We can read if there are completed requests. */
    698       1.1   thorpej 	if (events & (POLLIN | POLLRDNORM))
    699       1.1   thorpej 		if (TAILQ_EMPTY(&ds->ds_complete) == 0)
    700       1.1   thorpej 			revents |= events & (POLLIN | POLLRDNORM);
    701       1.1   thorpej 
    702       1.1   thorpej 	/*
    703       1.1   thorpej 	 * We can write if fewer than DMIO_NREQS_MAX requests
    704       1.1   thorpej 	 * are already in the queue.
    705       1.1   thorpej 	 */
    706       1.1   thorpej 	if (events & (POLLOUT | POLLWRNORM))
    707       1.1   thorpej 		if (ds->ds_nreqs < DMIO_NREQS_MAX)
    708       1.1   thorpej 			revents |= events & (POLLOUT | POLLWRNORM);
    709       1.1   thorpej 
                            	/*
                            	 * Nothing is ready: record the current LWP on ds_selq and
                            	 * note in ds_flags that a selector has been recorded.
                            	 */
    710       1.1   thorpej 	if (revents == 0) {
    711      1.31        ad 		selrecord(curlwp, &ds->ds_selq);
    712       1.1   thorpej 		ds->ds_flags |= DMIO_STATE_SEL;
    713       1.1   thorpej 	}
    714       1.1   thorpej 
    715       1.1   thorpej  out:
    716      1.40  jakllsch 	mutex_exit(&ds->ds_lock);
    717       1.1   thorpej 
    718       1.1   thorpej 	return (revents);
    719       1.1   thorpej }
    720       1.1   thorpej 
    721       1.1   thorpej /*
    722       1.1   thorpej  * dmio_close:
    723       1.1   thorpej  *
    724       1.1   thorpej  *	Close file op.
                             *
                             *	Marks the state dead and frees every completed request still
                             *	on ds_complete.  If no requests remain outstanding afterwards,
                             *	the dmio_state is handed to dmio_state_put() and the session
                             *	(if any) is destroyed.  If requests are still pending, neither
                             *	is released here.  fp->f_data is cleared in both cases.
                             *	Always returns 0.
    725       1.1   thorpej  */
    726       1.1   thorpej static int
    727      1.31        ad dmio_close(struct file *fp)
    728       1.1   thorpej {
    729       1.1   thorpej 	struct dmio_state *ds = (struct dmio_state *) fp->f_data;
    730       1.1   thorpej 	struct dmio_usrreq_state *dus;
    731       1.1   thorpej 	struct dmover_session *dses;
    732       1.1   thorpej 
    733      1.40  jakllsch 	mutex_enter(&ds->ds_lock);
    734       1.1   thorpej 
    735       1.1   thorpej 	ds->ds_flags |= DMIO_STATE_DEAD;
    736       1.1   thorpej 
    737       1.1   thorpej 	/* Garbage-collect all the responses on the queue. */
    738       1.1   thorpej 	while ((dus = TAILQ_FIRST(&ds->ds_complete)) != NULL) {
    739       1.1   thorpej 		TAILQ_REMOVE(&ds->ds_complete, dus, dus_q);
    740       1.1   thorpej 		ds->ds_nreqs--;
                            		/*
                            		 * The entry is already unlinked and uncounted, so the
                            		 * lock is dropped around the two free calls and retaken
                            		 * before the queue is examined again.
                            		 */
    741      1.40  jakllsch 		mutex_exit(&ds->ds_lock);
    742       1.1   thorpej 		dmover_request_free(dus->dus_req);
    743       1.1   thorpej 		dmio_usrreq_fini(ds, dus);
    744      1.40  jakllsch 		mutex_enter(&ds->ds_lock);
    745       1.1   thorpej 	}
    746       1.1   thorpej 
    747       1.1   thorpej 	/*
    748       1.1   thorpej 	 * If there are any requests pending, we have to wait for
    749       1.1   thorpej 	 * them.  Don't free the dmio_state in this case.
    750       1.1   thorpej 	 */
    751       1.1   thorpej 	if (ds->ds_nreqs == 0) {
                            		/*
                            		 * Save the session pointer before giving up ds; ds is
                            		 * not dereferenced again after dmio_state_put().
                            		 */
    752       1.1   thorpej 		dses = ds->ds_session;
    753      1.40  jakllsch 		mutex_exit(&ds->ds_lock);
    754      1.40  jakllsch 		dmio_state_put(ds);
    755       1.1   thorpej 	} else {
                            		/*
                            		 * Requests are still pending: leave the session alone.
                            		 * NOTE(review): presumably the request completion path
                            		 * releases the state and session once the last pending
                            		 * request finishes on a dead state -- confirm.
                            		 */
    756       1.1   thorpej 		dses = NULL;
    757      1.40  jakllsch 		mutex_exit(&ds->ds_lock);
    758       1.1   thorpej 	}
    759       1.1   thorpej 
                            	/* Detach the state from the file in either case. */
    760       1.1   thorpej 	fp->f_data = NULL;
    761       1.1   thorpej 
    762       1.1   thorpej 	if (dses != NULL)
    763       1.1   thorpej 		dmover_session_destroy(dses);
    764       1.1   thorpej 
    765       1.1   thorpej 	return (0);
    766       1.1   thorpej }
    767       1.1   thorpej 
                            /*
                             * dmio_fileops:
                             *
                             *	File operations vector passed to fd_clone() by dmoverioopen().
                             *	read, write, ioctl, poll, stat and close use the dmio_*
                             *	handlers; fcntl, kqfilter and restart use the fnullop_*
                             *	routines.
                             */
    768      1.15  christos static const struct fileops dmio_fileops = {
    769      1.32        ad 	.fo_read = dmio_read,
    770      1.32        ad 	.fo_write = dmio_write,
    771      1.32        ad 	.fo_ioctl = dmio_ioctl,
    772      1.32        ad 	.fo_fcntl = fnullop_fcntl,
    773      1.32        ad 	.fo_poll = dmio_poll,
    774      1.33  christos 	.fo_stat = dmio_stat,
    775      1.32        ad 	.fo_close = dmio_close,
    776      1.32        ad 	.fo_kqfilter = fnullop_kqfilter,
    777      1.37       dsl 	.fo_restart = fnullop_restart,
    778       1.1   thorpej };
    779       1.1   thorpej 
    780       1.1   thorpej /*
    781       1.1   thorpej  * dmoverioopen:
    782       1.1   thorpej  *
    783       1.1   thorpej  *	Device switch open routine.
                             *
                             *	Allocates a file and descriptor with fd_allocfile(), obtains
                             *	a dmio_state from dmio_state_get(), and hands both to
                             *	fd_clone() together with dmio_fileops.  Returns the error
                             *	from fd_allocfile() if that fails, otherwise whatever
                             *	fd_clone() returns.  The dev, mode and l arguments are unused.
    784       1.1   thorpej  */
    785       1.1   thorpej int
    786      1.18  christos dmoverioopen(dev_t dev, int flag, int mode, struct lwp *l)
    787       1.1   thorpej {
    788       1.1   thorpej 	struct dmio_state *ds;
    789       1.1   thorpej 	struct file *fp;
    790      1.40  jakllsch 	int error, fd;
    791       1.1   thorpej 
    792      1.31        ad 	if ((error = fd_allocfile(&fp, &fd)) != 0)
    793       1.1   thorpej 		return (error);
    794       1.1   thorpej 
                            	/*
                            	 * NOTE(review): the result of dmio_state_get() is not checked;
                            	 * presumably it cannot fail -- confirm against its definition.
                            	 */
    795      1.40  jakllsch 	ds = dmio_state_get();
    796       1.1   thorpej 
                            	/* The new state becomes the private data of the cloned file. */
    797      1.31        ad 	return fd_clone(fp, fd, flag, &dmio_fileops, ds);
    798       1.1   thorpej }
    799