Home | History | Annotate | Line # | Download | only in ext2fs
ext2fs_readwrite.c revision 1.16
      1  1.16       chs /*	$NetBSD: ext2fs_readwrite.c,v 1.16 2001/02/27 04:37:47 chs Exp $	*/
      2   1.1    bouyer 
      3   1.1    bouyer /*-
      4   1.1    bouyer  * Copyright (c) 1997 Manuel Bouyer.
      5   1.1    bouyer  * Copyright (c) 1993
      6   1.1    bouyer  *	The Regents of the University of California.  All rights reserved.
      7   1.1    bouyer  *
      8   1.1    bouyer  * Redistribution and use in source and binary forms, with or without
      9   1.1    bouyer  * modification, are permitted provided that the following conditions
     10   1.1    bouyer  * are met:
     11   1.1    bouyer  * 1. Redistributions of source code must retain the above copyright
     12   1.1    bouyer  *    notice, this list of conditions and the following disclaimer.
     13   1.1    bouyer  * 2. Redistributions in binary form must reproduce the above copyright
     14   1.1    bouyer  *    notice, this list of conditions and the following disclaimer in the
     15   1.1    bouyer  *    documentation and/or other materials provided with the distribution.
     16   1.1    bouyer  * 3. All advertising materials mentioning features or use of this software
     17   1.1    bouyer  *    must display the following acknowledgement:
     18   1.1    bouyer  *	This product includes software developed by the University of
     19   1.1    bouyer  *	California, Berkeley and its contributors.
     20   1.1    bouyer  * 4. Neither the name of the University nor the names of its contributors
     21   1.1    bouyer  *    may be used to endorse or promote products derived from this software
     22   1.1    bouyer  *    without specific prior written permission.
     23   1.1    bouyer  *
     24   1.1    bouyer  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     25   1.1    bouyer  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     26   1.1    bouyer  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     27   1.1    bouyer  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     28   1.1    bouyer  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     29   1.1    bouyer  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     30   1.1    bouyer  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     31   1.1    bouyer  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     32   1.1    bouyer  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     33   1.1    bouyer  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     34   1.1    bouyer  * SUCH DAMAGE.
     35   1.1    bouyer  *
     36   1.1    bouyer  *	@(#)ufs_readwrite.c	8.8 (Berkeley) 8/4/94
     37   1.1    bouyer  * Modified for ext2fs by Manuel Bouyer.
     38   1.1    bouyer  */
     39   1.5       mrg 
     40   1.1    bouyer #include <sys/param.h>
     41   1.1    bouyer #include <sys/systm.h>
     42   1.1    bouyer #include <sys/resourcevar.h>
     43   1.1    bouyer #include <sys/kernel.h>
     44   1.1    bouyer #include <sys/file.h>
     45   1.1    bouyer #include <sys/stat.h>
     46   1.1    bouyer #include <sys/buf.h>
     47   1.1    bouyer #include <sys/proc.h>
     48   1.1    bouyer #include <sys/conf.h>
     49   1.1    bouyer #include <sys/mount.h>
     50   1.1    bouyer #include <sys/vnode.h>
     51   1.1    bouyer #include <sys/malloc.h>
     52   1.1    bouyer #include <sys/signalvar.h>
     53   1.1    bouyer 
     54   1.1    bouyer #include <ufs/ufs/quota.h>
     55   1.1    bouyer #include <ufs/ufs/inode.h>
     56   1.1    bouyer #include <ufs/ext2fs/ext2fs.h>
     57   1.1    bouyer #include <ufs/ext2fs/ext2fs_extern.h>
     58   1.1    bouyer 
     59   1.1    bouyer 
      /*
       * Compile-time switches consulted by the buffer-cache paths in this file.
       * Both are defined as 0 here, so the `else if (doclusterread)` branch in
       * ext2fs_read() and the `if (doclusterwrite)` branch in ext2fs_write()
       * are never taken.
       */
      60   1.1    bouyer #define doclusterread 0 /* XXX underway */
      61   1.1    bouyer #define doclusterwrite 0
     62   1.1    bouyer 
     63   1.1    bouyer /*
     64   1.1    bouyer  * Vnode op for reading.
     65   1.1    bouyer  */
     66   1.1    bouyer /* ARGSUSED */
     67   1.1    bouyer int
     68   1.1    bouyer ext2fs_read(v)
     69   1.1    bouyer 	void *v;
     70   1.1    bouyer {
     71   1.1    bouyer 	struct vop_read_args /* {
     72   1.1    bouyer 		struct vnode *a_vp;
     73   1.1    bouyer 		struct uio *a_uio;
     74   1.1    bouyer 		int a_ioflag;
     75   1.1    bouyer 		struct ucred *a_cred;
     76   1.1    bouyer 	} */ *ap = v;
     77  1.11  augustss 	struct vnode *vp;
     78  1.11  augustss 	struct inode *ip;
     79  1.11  augustss 	struct uio *uio;
     80  1.11  augustss 	struct m_ext2fs *fs;
     81   1.1    bouyer 	struct buf *bp;
     82  1.14       chs 	void *win;
     83  1.14       chs 	vsize_t bytelen;
     84   1.6      fvdl 	ufs_daddr_t lbn, nextlbn;
     85   1.1    bouyer 	off_t bytesinfile;
     86   1.1    bouyer 	long size, xfersize, blkoffset;
     87   1.1    bouyer 	int error;
     88   1.1    bouyer 
     89   1.1    bouyer 	vp = ap->a_vp;
     90   1.1    bouyer 	ip = VTOI(vp);
     91   1.1    bouyer 	uio = ap->a_uio;
     92   1.1    bouyer 
     93   1.1    bouyer #ifdef DIAGNOSTIC
     94   1.1    bouyer 	if (uio->uio_rw != UIO_READ)
     95   1.1    bouyer 		panic("%s: mode", "ext2fs_read");
     96   1.1    bouyer 
     97   1.1    bouyer 	if (vp->v_type == VLNK) {
     98   1.1    bouyer 		if ((int)ip->i_e2fs_size < vp->v_mount->mnt_maxsymlinklen ||
     99   1.1    bouyer 			(vp->v_mount->mnt_maxsymlinklen == 0 &&
    100   1.1    bouyer 			 ip->i_e2fs_nblock == 0))
    101   1.1    bouyer 			panic("%s: short symlink", "ext2fs_read");
    102   1.1    bouyer 	} else if (vp->v_type != VREG && vp->v_type != VDIR)
    103   1.1    bouyer 		panic("%s: type %d", "ext2fs_read", vp->v_type);
    104   1.1    bouyer #endif
    105   1.1    bouyer 	fs = ip->i_e2fs;
    106   1.1    bouyer 	if ((u_int64_t)uio->uio_offset >
    107   1.1    bouyer 		((u_int64_t)0x80000000 * fs->e2fs_bsize - 1))
    108   1.1    bouyer 		return (EFBIG);
    109   1.1    bouyer 	if (uio->uio_resid == 0)
    110   1.1    bouyer 		return (0);
    111   1.1    bouyer 
    112  1.14       chs 	if (vp->v_type == VREG) {
    113  1.14       chs 		error = 0;
    114  1.14       chs 		while (uio->uio_resid > 0) {
    115  1.14       chs 
    116  1.16       chs 			bytelen = MIN(ip->i_e2fs_size - uio->uio_offset,
    117  1.14       chs 			    uio->uio_resid);
    118  1.14       chs 
    119  1.14       chs 			if (bytelen == 0) {
    120  1.14       chs 				break;
    121  1.14       chs 			}
    122  1.14       chs 			win = ubc_alloc(&vp->v_uvm.u_obj, uio->uio_offset,
    123  1.14       chs 					&bytelen, UBC_READ);
    124  1.14       chs 			error = uiomove(win, bytelen, uio);
    125  1.14       chs 			ubc_release(win, 0);
    126  1.14       chs 			if (error) {
    127  1.14       chs 				break;
    128  1.14       chs 			}
    129  1.14       chs 		}
    130  1.14       chs 		goto out;
    131  1.14       chs 	}
    132  1.14       chs 
    133   1.1    bouyer 	for (error = 0, bp = NULL; uio->uio_resid > 0; bp = NULL) {
    134   1.1    bouyer 		if ((bytesinfile = ip->i_e2fs_size - uio->uio_offset) <= 0)
    135   1.1    bouyer 			break;
    136   1.1    bouyer 		lbn = lblkno(fs, uio->uio_offset);
    137   1.1    bouyer 		nextlbn = lbn + 1;
    138   1.1    bouyer 		size = fs->e2fs_bsize;
    139   1.1    bouyer 		blkoffset = blkoff(fs, uio->uio_offset);
    140   1.1    bouyer 		xfersize = fs->e2fs_bsize - blkoffset;
    141   1.1    bouyer 		if (uio->uio_resid < xfersize)
    142   1.1    bouyer 			xfersize = uio->uio_resid;
    143   1.1    bouyer 		if (bytesinfile < xfersize)
    144   1.1    bouyer 			xfersize = bytesinfile;
    145   1.1    bouyer 
    146   1.1    bouyer 		if (lblktosize(fs, nextlbn) >= ip->i_e2fs_size)
    147   1.1    bouyer 			error = bread(vp, lbn, size, NOCRED, &bp);
    148   1.1    bouyer 		else if (doclusterread)
    149   1.1    bouyer 			error = cluster_read(vp,
    150   1.1    bouyer 				ip->i_e2fs_size, lbn, size, NOCRED, &bp);
    151   1.1    bouyer 		else if (lbn - 1 == vp->v_lastr) {
    152   1.1    bouyer 			int nextsize = fs->e2fs_bsize;
    153   1.1    bouyer 			error = breadn(vp, lbn,
    154   1.1    bouyer 				size, &nextlbn, &nextsize, 1, NOCRED, &bp);
    155   1.1    bouyer 		} else
    156   1.1    bouyer 			error = bread(vp, lbn, size, NOCRED, &bp);
    157   1.1    bouyer 		if (error)
    158   1.1    bouyer 			break;
    159   1.1    bouyer 		vp->v_lastr = lbn;
    160   1.1    bouyer 
    161   1.1    bouyer 		/*
    162   1.1    bouyer 		 * We should only get non-zero b_resid when an I/O error
    163   1.1    bouyer 		 * has occurred, which should cause us to break above.
    164   1.1    bouyer 		 * However, if the short read did not cause an error,
    165   1.1    bouyer 		 * then we want to ensure that we do not uiomove bad
    166   1.1    bouyer 		 * or uninitialized data.
    167   1.1    bouyer 		 */
    168   1.1    bouyer 		size -= bp->b_resid;
    169   1.1    bouyer 		if (size < xfersize) {
    170   1.1    bouyer 			if (size == 0)
    171   1.1    bouyer 				break;
    172   1.1    bouyer 			xfersize = size;
    173   1.1    bouyer 		}
    174  1.14       chs 		error = uiomove((char *)bp->b_data + blkoffset, xfersize, uio);
    175   1.1    bouyer 		if (error)
    176   1.1    bouyer 			break;
    177   1.1    bouyer 		brelse(bp);
    178   1.1    bouyer 	}
    179   1.1    bouyer 	if (bp != NULL)
    180   1.1    bouyer 		brelse(bp);
    181  1.14       chs 
    182  1.14       chs out:
    183   1.7    kleink 	if (!(vp->v_mount->mnt_flag & MNT_NOATIME)) {
    184   1.1    bouyer 		ip->i_flag |= IN_ACCESS;
    185   1.9   mycroft 		if ((ap->a_ioflag & IO_SYNC) == IO_SYNC)
    186  1.12  perseant 			error = VOP_UPDATE(vp, NULL, NULL, UPDATE_WAIT);
    187   1.7    kleink 	}
    188   1.1    bouyer 	return (error);
    189   1.1    bouyer }
    190   1.1    bouyer 
    191   1.1    bouyer /*
    192   1.1    bouyer  * Vnode op for writing.
    193   1.1    bouyer  */
    194   1.1    bouyer int
    195   1.1    bouyer ext2fs_write(v)
    196   1.1    bouyer 	void *v;
    197   1.1    bouyer {
    198   1.1    bouyer 	struct vop_write_args /* {
    199   1.1    bouyer 		struct vnode *a_vp;
    200   1.1    bouyer 		struct uio *a_uio;
    201   1.1    bouyer 		int a_ioflag;
    202   1.1    bouyer 		struct ucred *a_cred;
    203   1.1    bouyer 	} */ *ap = v;
    204  1.11  augustss 	struct vnode *vp;
    205  1.11  augustss 	struct uio *uio;
    206  1.11  augustss 	struct inode *ip;
    207  1.11  augustss 	struct m_ext2fs *fs;
    208   1.1    bouyer 	struct buf *bp;
    209   1.1    bouyer 	struct proc *p;
    210   1.6      fvdl 	ufs_daddr_t lbn;
    211   1.1    bouyer 	off_t osize;
    212  1.14       chs 	int blkoffset, error, flags, ioflag, resid, xfersize;
    213  1.14       chs 	vsize_t bytelen;
    214  1.14       chs 	void *win;
    215  1.14       chs 	off_t oldoff;
    216  1.14       chs 	boolean_t rv;
    217   1.1    bouyer 
    218   1.1    bouyer 	ioflag = ap->a_ioflag;
    219   1.1    bouyer 	uio = ap->a_uio;
    220   1.1    bouyer 	vp = ap->a_vp;
    221   1.1    bouyer 	ip = VTOI(vp);
    222  1.14       chs 	error = 0;
    223   1.1    bouyer 
    224   1.1    bouyer #ifdef DIAGNOSTIC
    225   1.1    bouyer 	if (uio->uio_rw != UIO_WRITE)
    226   1.1    bouyer 		panic("%s: mode", "ext2fs_write");
    227   1.1    bouyer #endif
    228   1.1    bouyer 
    229   1.1    bouyer 	switch (vp->v_type) {
    230   1.1    bouyer 	case VREG:
    231   1.1    bouyer 		if (ioflag & IO_APPEND)
    232   1.1    bouyer 			uio->uio_offset = ip->i_e2fs_size;
    233   1.1    bouyer 		if ((ip->i_e2fs_flags & EXT2_APPEND) &&
    234   1.1    bouyer 			uio->uio_offset != ip->i_e2fs_size)
    235   1.1    bouyer 			return (EPERM);
    236   1.1    bouyer 		/* FALLTHROUGH */
    237   1.1    bouyer 	case VLNK:
    238   1.1    bouyer 		break;
    239   1.1    bouyer 	case VDIR:
    240   1.1    bouyer 		if ((ioflag & IO_SYNC) == 0)
    241   1.1    bouyer 			panic("%s: nonsync dir write", "ext2fs_write");
    242   1.1    bouyer 		break;
    243   1.1    bouyer 	default:
    244   1.1    bouyer 		panic("%s: type", "ext2fs_write");
    245   1.1    bouyer 	}
    246   1.1    bouyer 
    247   1.1    bouyer 	fs = ip->i_e2fs;
    248   1.1    bouyer 	if (uio->uio_offset < 0 ||
    249   1.1    bouyer 		(u_int64_t)uio->uio_offset + uio->uio_resid >
    250   1.1    bouyer 		((u_int64_t)0x80000000 * fs->e2fs_bsize - 1))
    251   1.1    bouyer 		return (EFBIG);
    252   1.1    bouyer 	/*
    253   1.1    bouyer 	 * Maybe this should be above the vnode op call, but so long as
    254   1.1    bouyer 	 * file servers have no limits, I don't think it matters.
    255   1.1    bouyer 	 */
    256   1.1    bouyer 	p = uio->uio_procp;
    257   1.1    bouyer 	if (vp->v_type == VREG && p &&
    258   1.1    bouyer 		uio->uio_offset + uio->uio_resid >
    259   1.1    bouyer 		p->p_rlimit[RLIMIT_FSIZE].rlim_cur) {
    260   1.1    bouyer 		psignal(p, SIGXFSZ);
    261   1.1    bouyer 		return (EFBIG);
    262   1.1    bouyer 	}
    263   1.1    bouyer 
    264   1.1    bouyer 	resid = uio->uio_resid;
    265   1.1    bouyer 	osize = ip->i_e2fs_size;
    266  1.14       chs 
    267  1.14       chs 	if (vp->v_type == VREG) {
    268  1.14       chs 		while (uio->uio_resid > 0) {
    269  1.14       chs 			oldoff = uio->uio_offset;
    270  1.14       chs 			blkoffset = blkoff(fs, uio->uio_offset);
    271  1.16       chs 			bytelen = MIN(fs->e2fs_bsize - blkoffset,
    272  1.14       chs 			    uio->uio_resid);
    273  1.14       chs 
    274  1.14       chs 			/*
    275  1.14       chs 			 * XXXUBC if file is mapped and this is the last block,
    276  1.14       chs 			 * process one page at a time.
    277  1.14       chs 			 */
    278  1.14       chs 
    279  1.14       chs 			error = ext2fs_balloc_range(vp, uio->uio_offset,
    280  1.14       chs 			    bytelen, ap->a_cred, 0);
    281  1.14       chs 			if (error) {
    282  1.14       chs 				break;
    283  1.14       chs 			}
    284  1.14       chs 			win = ubc_alloc(&vp->v_uvm.u_obj, uio->uio_offset,
    285  1.14       chs 			    &bytelen, UBC_WRITE);
    286  1.14       chs 			error = uiomove(win, bytelen, uio);
    287  1.14       chs 			ubc_release(win, 0);
    288  1.14       chs 			if (error) {
    289  1.14       chs 				break;
    290  1.14       chs 			}
    291  1.14       chs 
    292  1.14       chs 			/*
    293  1.14       chs 			 * flush what we just wrote if necessary.
    294  1.14       chs 			 * XXXUBC simplistic async flushing.
    295  1.14       chs 			 */
    296  1.14       chs 
    297  1.14       chs 			if (oldoff >> 16 != uio->uio_offset >> 16) {
    298  1.14       chs 				simple_lock(&vp->v_uvm.u_obj.vmobjlock);
    299  1.14       chs 				rv = vp->v_uvm.u_obj.pgops->pgo_flush(
    300  1.14       chs 				    &vp->v_uvm.u_obj, (oldoff >> 16) << 16,
    301  1.14       chs 				    (uio->uio_offset >> 16) << 16, PGO_CLEANIT);
    302  1.14       chs 				simple_unlock(&vp->v_uvm.u_obj.vmobjlock);
    303  1.14       chs 			}
    304  1.14       chs 		}
    305  1.14       chs 		goto out;
    306  1.14       chs 	}
    307  1.14       chs 
    308   1.1    bouyer 	flags = ioflag & IO_SYNC ? B_SYNC : 0;
    309   1.1    bouyer 	for (error = 0; uio->uio_resid > 0;) {
    310   1.1    bouyer 		lbn = lblkno(fs, uio->uio_offset);
    311   1.1    bouyer 		blkoffset = blkoff(fs, uio->uio_offset);
    312  1.16       chs 		xfersize = MIN(fs->e2fs_bsize - blkoffset, uio->uio_resid);
    313  1.14       chs 		if (xfersize < fs->e2fs_bsize)
    314   1.1    bouyer 			flags |= B_CLRBUF;
    315   1.1    bouyer 		else
    316   1.1    bouyer 			flags &= ~B_CLRBUF;
    317  1.15       chs 		error = ext2fs_balloc(ip,
    318  1.15       chs 		    lbn, blkoffset + xfersize, ap->a_cred, &bp, flags);
    319   1.1    bouyer 		if (error)
    320   1.1    bouyer 			break;
    321  1.14       chs 		if (ip->i_e2fs_size < uio->uio_offset + xfersize) {
    322   1.1    bouyer 			ip->i_e2fs_size = uio->uio_offset + xfersize;
    323   1.1    bouyer 		}
    324  1.14       chs 		error = uiomove((char *)bp->b_data + blkoffset, xfersize, uio);
    325   1.1    bouyer 		if (ioflag & IO_SYNC)
    326   1.1    bouyer 			(void)bwrite(bp);
    327   1.1    bouyer 		else if (xfersize + blkoffset == fs->e2fs_bsize)
    328   1.1    bouyer 			if (doclusterwrite)
    329   1.1    bouyer 				cluster_write(bp, ip->i_e2fs_size);
    330   1.1    bouyer 			else
    331   1.1    bouyer 				bawrite(bp);
    332   1.1    bouyer 		else
    333   1.1    bouyer 			bdwrite(bp);
    334   1.1    bouyer 		if (error || xfersize == 0)
    335   1.1    bouyer 			break;
    336   1.1    bouyer 	}
    337   1.1    bouyer 	/*
    338   1.1    bouyer 	 * If we successfully wrote any data, and we are not the superuser
    339   1.1    bouyer 	 * we clear the setuid and setgid bits as a precaution against
    340   1.1    bouyer 	 * tampering.
    341   1.1    bouyer 	 */
    342  1.14       chs out:
    343  1.14       chs 	ip->i_flag |= IN_CHANGE | IN_UPDATE;
    344   1.1    bouyer 	if (resid > uio->uio_resid && ap->a_cred && ap->a_cred->cr_uid != 0)
    345   1.1    bouyer 		ip->i_e2fs_mode &= ~(ISUID | ISGID);
    346   1.1    bouyer 	if (error) {
    347   1.1    bouyer 		if (ioflag & IO_UNIT) {
    348   1.1    bouyer 			(void)VOP_TRUNCATE(vp, osize,
    349   1.1    bouyer 				ioflag & IO_SYNC, ap->a_cred, uio->uio_procp);
    350   1.1    bouyer 			uio->uio_offset -= resid - uio->uio_resid;
    351   1.1    bouyer 			uio->uio_resid = resid;
    352   1.1    bouyer 		}
    353   1.9   mycroft 	} else if (resid > uio->uio_resid && (ioflag & IO_SYNC) == IO_SYNC)
    354  1.12  perseant 		error = VOP_UPDATE(vp, NULL, NULL, UPDATE_WAIT);
    355   1.1    bouyer 	return (error);
    356   1.1    bouyer }
    357