lfs_vfsops.c revision 1.10 1 /* $NetBSD: lfs_vfsops.c,v 1.10 1996/02/09 22:28:58 christos Exp $ */
2
3 /*
4 * Copyright (c) 1989, 1991, 1993, 1994
5 * The Regents of the University of California. All rights reserved.
6 *
7 * Redistribution and use in source and binary forms, with or without
8 * modification, are permitted provided that the following conditions
9 * are met:
10 * 1. Redistributions of source code must retain the above copyright
11 * notice, this list of conditions and the following disclaimer.
12 * 2. Redistributions in binary form must reproduce the above copyright
13 * notice, this list of conditions and the following disclaimer in the
14 * documentation and/or other materials provided with the distribution.
15 * 3. All advertising materials mentioning features or use of this software
16 * must display the following acknowledgement:
17 * This product includes software developed by the University of
18 * California, Berkeley and its contributors.
19 * 4. Neither the name of the University nor the names of its contributors
20 * may be used to endorse or promote products derived from this software
21 * without specific prior written permission.
22 *
23 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
24 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
25 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
26 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
27 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
28 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
29 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
30 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
31 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
32 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
33 * SUCH DAMAGE.
34 *
35 * @(#)lfs_vfsops.c 8.10 (Berkeley) 11/21/94
36 */
37
38 #include <sys/param.h>
39 #include <sys/systm.h>
40 #include <sys/namei.h>
41 #include <sys/proc.h>
42 #include <sys/kernel.h>
43 #include <sys/vnode.h>
44 #include <sys/mount.h>
45 #include <sys/buf.h>
46 #include <sys/mbuf.h>
47 #include <sys/file.h>
48 #include <sys/disklabel.h>
49 #include <sys/ioctl.h>
50 #include <sys/errno.h>
51 #include <sys/malloc.h>
52 #include <sys/socket.h>
53
54 #include <miscfs/specfs/specdev.h>
55
56 #include <ufs/ufs/quota.h>
57 #include <ufs/ufs/inode.h>
58 #include <ufs/ufs/ufsmount.h>
59 #include <ufs/ufs/ufs_extern.h>
60
61 #include <ufs/lfs/lfs.h>
62 #include <ufs/lfs/lfs_extern.h>
63
64 int lfs_mountfs __P((struct vnode *, struct mount *, struct proc *));
65
66 struct vfsops lfs_vfsops = {
67 MOUNT_LFS,
68 lfs_mount,
69 ufs_start,
70 lfs_unmount,
71 ufs_root,
72 ufs_quotactl,
73 lfs_statfs,
74 lfs_sync,
75 lfs_vget,
76 lfs_fhtovp,
77 lfs_vptofh,
78 lfs_init,
79 };
80
/*
 * Mount LFS as the root file system.
 *
 * Not implemented: the routine calls panic() unconditionally.  The
 * return statement that follows the panic() call is kept so that the
 * function still yields a value.
 */
int
lfs_mountroot()
{

	panic("lfs_mountroot");		/* XXX -- implement */
	return (0);
}
87
88 /*
89 * VFS Operations.
90 *
91 * mount system call
92 */
93 int
94 lfs_mount(mp, path, data, ndp, p)
95 register struct mount *mp;
96 char *path;
97 caddr_t data;
98 struct nameidata *ndp;
99 struct proc *p;
100 {
101 struct vnode *devvp;
102 struct ufs_args args;
103 struct ufsmount *ump = NULL;
104 register struct lfs *fs = NULL; /* LFS */
105 size_t size;
106 int error;
107 mode_t accessmode;
108
109 error = copyin(data, (caddr_t)&args, sizeof (struct ufs_args));
110 if (error)
111 return (error);
112
113 /* Until LFS can do NFS right. XXX */
114 if (args.export.ex_flags & MNT_EXPORTED)
115 return (EINVAL);
116
117 /*
118 * If updating, check whether changing from read-only to
119 * read/write; if there is no device name, that's all we do.
120 */
121 if (mp->mnt_flag & MNT_UPDATE) {
122 ump = VFSTOUFS(mp);
123 if (fs->lfs_ronly && (mp->mnt_flag & MNT_WANTRDWR)) {
124 /*
125 * If upgrade to read-write by non-root, then verify
126 * that user has necessary permissions on the device.
127 */
128 if (p->p_ucred->cr_uid != 0) {
129 VOP_LOCK(ump->um_devvp);
130 error = VOP_ACCESS(ump->um_devvp, VREAD|VWRITE,
131 p->p_ucred, p);
132 if (error) {
133 VOP_UNLOCK(ump->um_devvp);
134 return (error);
135 }
136 VOP_UNLOCK(ump->um_devvp);
137 }
138 fs->lfs_ronly = 0;
139 }
140 if (args.fspec == 0) {
141 /*
142 * Process export requests.
143 */
144 return (vfs_export(mp, &ump->um_export, &args.export));
145 }
146 }
147 /*
148 * Not an update, or updating the name: look up the name
149 * and verify that it refers to a sensible block device.
150 */
151 NDINIT(ndp, LOOKUP, FOLLOW, UIO_USERSPACE, args.fspec, p);
152 if ((error = namei(ndp)) != 0)
153 return (error);
154 devvp = ndp->ni_vp;
155 if (devvp->v_type != VBLK) {
156 vrele(devvp);
157 return (ENOTBLK);
158 }
159 if (major(devvp->v_rdev) >= nblkdev) {
160 vrele(devvp);
161 return (ENXIO);
162 }
163 /*
164 * If mount by non-root, then verify that user has necessary
165 * permissions on the device.
166 */
167 if (p->p_ucred->cr_uid != 0) {
168 accessmode = VREAD;
169 if ((mp->mnt_flag & MNT_RDONLY) == 0)
170 accessmode |= VWRITE;
171 VOP_LOCK(devvp);
172 error = VOP_ACCESS(devvp, accessmode, p->p_ucred, p);
173 if (error) {
174 vput(devvp);
175 return (error);
176 }
177 VOP_UNLOCK(devvp);
178 }
179 if ((mp->mnt_flag & MNT_UPDATE) == 0)
180 error = lfs_mountfs(devvp, mp, p); /* LFS */
181 else {
182 if (devvp != ump->um_devvp)
183 error = EINVAL; /* needs translation */
184 else
185 vrele(devvp);
186 }
187 if (error) {
188 vrele(devvp);
189 return (error);
190 }
191 ump = VFSTOUFS(mp);
192 fs = ump->um_lfs; /* LFS */
193 #ifdef NOTLFS /* LFS */
194 (void) copyinstr(path, fs->fs_fsmnt, sizeof(fs->fs_fsmnt) - 1, &size);
195 bzero(fs->fs_fsmnt + size, sizeof(fs->fs_fsmnt) - size);
196 bcopy(fs->fs_fsmnt, mp->mnt_stat.f_mntonname, MNAMELEN);
197 #else
198 (void)copyinstr(path, fs->lfs_fsmnt, sizeof(fs->lfs_fsmnt) - 1, &size);
199 bzero(fs->lfs_fsmnt + size, sizeof(fs->lfs_fsmnt) - size);
200 bcopy(fs->lfs_fsmnt, mp->mnt_stat.f_mntonname, MNAMELEN);
201 #endif
202 (void) copyinstr(args.fspec, mp->mnt_stat.f_mntfromname, MNAMELEN - 1,
203 &size);
204 bzero(mp->mnt_stat.f_mntfromname + size, MNAMELEN - size);
205 return (0);
206 }
207
208 /*
209 * Common code for mount and mountroot
210 * LFS specific
211 */
212 int
213 lfs_mountfs(devvp, mp, p)
214 register struct vnode *devvp;
215 struct mount *mp;
216 struct proc *p;
217 {
218 extern struct vnode *rootvp;
219 register struct lfs *fs;
220 register struct ufsmount *ump;
221 struct vnode *vp;
222 struct buf *bp;
223 struct partinfo dpart;
224 dev_t dev;
225 int error, i, ronly, size;
226 struct ucred *cred;
227
228 cred = p ? p->p_ucred : NOCRED;
229 /*
230 * Disallow multiple mounts of the same device.
231 * Disallow mounting of a device that is currently in use
232 * (except for root, which might share swap device for miniroot).
233 * Flush out any old buffers remaining from a previous use.
234 */
235 if ((error = vfs_mountedon(devvp)) != 0)
236 return (error);
237 if (vcount(devvp) > 1 && devvp != rootvp)
238 return (EBUSY);
239 if ((error = vinvalbuf(devvp, V_SAVE, cred, p, 0, 0)) != 0)
240 return (error);
241
242 ronly = (mp->mnt_flag & MNT_RDONLY) != 0;
243 error = VOP_OPEN(devvp, ronly ? FREAD : FREAD|FWRITE, FSCRED, p);
244 if (error)
245 return (error);
246
247 if (VOP_IOCTL(devvp, DIOCGPART, (caddr_t)&dpart, FREAD, cred, p) != 0)
248 size = DEV_BSIZE;
249 else {
250 size = dpart.disklab->d_secsize;
251 #ifdef NEVER_USED
252 dpart.part->p_fstype = FS_LFS;
253 dpart.part->p_fsize = fs->lfs_fsize; /* frag size */
254 dpart.part->p_frag = fs->lfs_frag; /* frags per block */
255 dpart.part->p_cpg = fs->lfs_segshift; /* segment shift */
256 #endif
257 }
258
259 /* Don't free random space on error. */
260 bp = NULL;
261 ump = NULL;
262
263 /* Read in the superblock. */
264 error = bread(devvp, LFS_LABELPAD / size, LFS_SBPAD, cred, &bp);
265 if (error)
266 goto out;
267 fs = (struct lfs *)bp->b_data;
268
269 /* Check the basics. */
270 if (fs->lfs_magic != LFS_MAGIC || fs->lfs_bsize > MAXBSIZE ||
271 fs->lfs_bsize < sizeof(struct lfs)) {
272 error = EINVAL; /* XXX needs translation */
273 goto out;
274 }
275
276 /* Allocate the mount structure, copy the superblock into it. */
277 ump = (struct ufsmount *)malloc(sizeof *ump, M_UFSMNT, M_WAITOK);
278 fs = ump->um_lfs = malloc(sizeof(struct lfs), M_UFSMNT, M_WAITOK);
279 bcopy(bp->b_data, fs, sizeof(struct lfs));
280 if (sizeof(struct lfs) < LFS_SBPAD) /* XXX why? */
281 bp->b_flags |= B_INVAL;
282 brelse(bp);
283 bp = NULL;
284
285 /* Set up the I/O information */
286 fs->lfs_iocount = 0;
287
288 /* Set up the ifile and lock aflags */
289 fs->lfs_doifile = 0;
290 fs->lfs_writer = 0;
291 fs->lfs_dirops = 0;
292 fs->lfs_seglock = 0;
293
294 /* Set the file system readonly/modify bits. */
295 fs->lfs_ronly = ronly;
296 if (ronly == 0)
297 fs->lfs_fmod = 1;
298
299 /* Initialize the mount structure. */
300 dev = devvp->v_rdev;
301 mp->mnt_data = (qaddr_t)ump;
302 mp->mnt_stat.f_fsid.val[0] = (long)dev;
303 mp->mnt_stat.f_fsid.val[1] = makefstype(MOUNT_LFS);
304 mp->mnt_maxsymlinklen = fs->lfs_maxsymlinklen;
305 mp->mnt_flag |= MNT_LOCAL;
306 ump->um_mountp = mp;
307 ump->um_dev = dev;
308 ump->um_devvp = devvp;
309 ump->um_bptrtodb = 0;
310 ump->um_seqinc = 1 << fs->lfs_fsbtodb;
311 ump->um_nindir = fs->lfs_nindir;
312 for (i = 0; i < MAXQUOTAS; i++)
313 ump->um_quotas[i] = NULLVP;
314 devvp->v_specflags |= SI_MOUNTEDON;
315
316 /*
317 * We use the ifile vnode for almost every operation. Instead of
318 * retrieving it from the hash table each time we retrieve it here,
319 * artificially increment the reference count and keep a pointer
320 * to it in the incore copy of the superblock.
321 */
322 if ((error = VFS_VGET(mp, LFS_IFILE_INUM, &vp)) != 0)
323 goto out;
324 fs->lfs_ivnode = vp;
325 VREF(vp);
326 vput(vp);
327
328 return (0);
329 out:
330 if (bp)
331 brelse(bp);
332 (void)VOP_CLOSE(devvp, ronly ? FREAD : FREAD|FWRITE, cred, p);
333 if (ump) {
334 free(ump->um_lfs, M_UFSMNT);
335 free(ump, M_UFSMNT);
336 mp->mnt_data = (qaddr_t)0;
337 }
338 return (error);
339 }
340
341 /*
342 * unmount system call
343 */
344 int
345 lfs_unmount(mp, mntflags, p)
346 struct mount *mp;
347 int mntflags;
348 struct proc *p;
349 {
350 register struct ufsmount *ump;
351 register struct lfs *fs;
352 int i, error, flags, ronly;
353
354 flags = 0;
355 if (mntflags & MNT_FORCE)
356 flags |= FORCECLOSE;
357
358 ump = VFSTOUFS(mp);
359 fs = ump->um_lfs;
360 #ifdef QUOTA
361 if (mp->mnt_flag & MNT_QUOTA) {
362 error = vflush(mp, fs->lfs_ivnode, SKIPSYSTEM|flags);
363 if (error)
364 return (error);
365 for (i = 0; i < MAXQUOTAS; i++) {
366 if (ump->um_quotas[i] == NULLVP)
367 continue;
368 quotaoff(p, mp, i);
369 }
370 /*
371 * Here we fall through to vflush again to ensure
372 * that we have gotten rid of all the system vnodes.
373 */
374 }
375 #endif
376 if ((error = vflush(mp, fs->lfs_ivnode, flags)) != 0)
377 return (error);
378 fs->lfs_clean = 1;
379 if ((error = VFS_SYNC(mp, 1, p->p_ucred, p)) != 0)
380 return (error);
381 if (fs->lfs_ivnode->v_dirtyblkhd.lh_first)
382 panic("lfs_unmount: still dirty blocks on ifile vnode\n");
383 vrele(fs->lfs_ivnode);
384 vgone(fs->lfs_ivnode);
385
386 ronly = !fs->lfs_ronly;
387 ump->um_devvp->v_specflags &= ~SI_MOUNTEDON;
388 error = VOP_CLOSE(ump->um_devvp,
389 ronly ? FREAD : FREAD|FWRITE, NOCRED, p);
390 vrele(ump->um_devvp);
391 free(fs, M_UFSMNT);
392 free(ump, M_UFSMNT);
393 mp->mnt_data = (qaddr_t)0;
394 mp->mnt_flag &= ~MNT_LOCAL;
395 return (error);
396 }
397
398 /*
399 * Get file system statistics.
400 */
401 int
402 lfs_statfs(mp, sbp, p)
403 struct mount *mp;
404 register struct statfs *sbp;
405 struct proc *p;
406 {
407 register struct lfs *fs;
408 register struct ufsmount *ump;
409
410 ump = VFSTOUFS(mp);
411 fs = ump->um_lfs;
412 if (fs->lfs_magic != LFS_MAGIC)
413 panic("lfs_statfs: magic");
414 sbp->f_type = 0;
415 sbp->f_bsize = fs->lfs_bsize;
416 sbp->f_iosize = fs->lfs_bsize;
417 sbp->f_blocks = dbtofsb(fs,fs->lfs_dsize);
418 sbp->f_bfree = dbtofsb(fs, fs->lfs_bfree);
419 sbp->f_bavail = (fs->lfs_dsize * (100 - fs->lfs_minfree) / 100) -
420 (fs->lfs_dsize - fs->lfs_bfree);
421 sbp->f_bavail = dbtofsb(fs, sbp->f_bavail);
422 sbp->f_files = fs->lfs_nfiles;
423 sbp->f_ffree = sbp->f_bfree * INOPB(fs);
424 if (sbp != &mp->mnt_stat) {
425 bcopy(mp->mnt_stat.f_mntonname, sbp->f_mntonname, MNAMELEN);
426 bcopy(mp->mnt_stat.f_mntfromname, sbp->f_mntfromname, MNAMELEN);
427 }
428 strncpy(sbp->f_fstypename, mp->mnt_op->vfs_name, MFSNAMELEN);
429 return (0);
430 }
431
432 /*
433 * Go through the disk queues to initiate sandbagged IO;
434 * go through the inodes to write those that have been modified;
435 * initiate the writing of the super block if it has been modified.
436 *
437 * Note: we are always called with the filesystem marked `MPBUSY'.
438 */
439 int
440 lfs_sync(mp, waitfor, cred, p)
441 struct mount *mp;
442 int waitfor;
443 struct ucred *cred;
444 struct proc *p;
445 {
446 int error;
447
448 /* All syncs must be checkpoints until roll-forward is implemented. */
449 error = lfs_segwrite(mp, SEGM_CKP | (waitfor ? SEGM_SYNC : 0));
450 #ifdef QUOTA
451 qsync(mp);
452 #endif
453 return (error);
454 }
455
456 /*
457 * Look up an LFS dinode number to find its incore vnode. If not already
458 * in core, read it in from the specified device. Return the inode locked.
459 * Detection and handling of mount points must be done by the calling routine.
460 */
461 int
462 lfs_vget(mp, ino, vpp)
463 struct mount *mp;
464 ino_t ino;
465 struct vnode **vpp;
466 {
467 register struct lfs *fs;
468 register struct inode *ip;
469 struct buf *bp;
470 struct ifile *ifp;
471 struct vnode *vp;
472 struct ufsmount *ump;
473 daddr_t daddr;
474 dev_t dev;
475 int error;
476
477 ump = VFSTOUFS(mp);
478 dev = ump->um_dev;
479 if ((*vpp = ufs_ihashget(dev, ino)) != NULL)
480 return (0);
481
482 /* Translate the inode number to a disk address. */
483 fs = ump->um_lfs;
484 if (ino == LFS_IFILE_INUM)
485 daddr = fs->lfs_idaddr;
486 else {
487 LFS_IENTRY(ifp, fs, ino, bp);
488 daddr = ifp->if_daddr;
489 brelse(bp);
490 if (daddr == LFS_UNUSED_DADDR)
491 return (ENOENT);
492 }
493
494 /* Allocate new vnode/inode. */
495 if ((error = lfs_vcreate(mp, ino, &vp)) != 0) {
496 *vpp = NULL;
497 return (error);
498 }
499
500 /*
501 * Put it onto its hash chain and lock it so that other requests for
502 * this inode will block if they arrive while we are sleeping waiting
503 * for old data structures to be purged or for the contents of the
504 * disk portion of this inode to be read.
505 */
506 ip = VTOI(vp);
507 ufs_ihashins(ip);
508
509 /*
510 * XXX
511 * This may not need to be here, logically it should go down with
512 * the i_devvp initialization.
513 * Ask Kirk.
514 */
515 ip->i_lfs = ump->um_lfs;
516
517 /* Read in the disk contents for the inode, copy into the inode. */
518 error = bread(ump->um_devvp, daddr, (int)fs->lfs_bsize, NOCRED, &bp);
519 if (error) {
520 /*
521 * The inode does not contain anything useful, so it would
522 * be misleading to leave it on its hash chain. With mode
523 * still zero, it will be unlinked and returned to the free
524 * list by vput().
525 */
526 vput(vp);
527 brelse(bp);
528 *vpp = NULL;
529 return (error);
530 }
531 ip->i_din = *lfs_ifind(fs, ino, (struct dinode *)bp->b_data);
532 brelse(bp);
533
534 /*
535 * Initialize the vnode from the inode, check for aliases. In all
536 * cases re-init ip, the underlying vnode/inode may have changed.
537 */
538 error = ufs_vinit(mp, lfs_specop_p, LFS_FIFOOPS, &vp);
539 if (error) {
540 vput(vp);
541 *vpp = NULL;
542 return (error);
543 }
544 /*
545 * Finish inode initialization now that aliasing has been resolved.
546 */
547 ip->i_devvp = ump->um_devvp;
548 VREF(ip->i_devvp);
549 *vpp = vp;
550 return (0);
551 }
552
553 /*
554 * File handle to vnode
555 *
556 * Have to be really careful about stale file handles:
557 * - check that the inode number is valid
558 * - call lfs_vget() to get the locked inode
559 * - check for an unallocated inode (i_mode == 0)
560 * - check that the given client host has export rights and return
561 * those rights via. exflagsp and credanonp
562 *
563 * XXX
564 * use ifile to see if inode is allocated instead of reading off disk
565 * what is the relationship between my generational number and the NFS
566 * generational number.
567 */
568 int
569 lfs_fhtovp(mp, fhp, nam, vpp, exflagsp, credanonp)
570 register struct mount *mp;
571 struct fid *fhp;
572 struct mbuf *nam;
573 struct vnode **vpp;
574 int *exflagsp;
575 struct ucred **credanonp;
576 {
577 register struct ufid *ufhp;
578
579 ufhp = (struct ufid *)fhp;
580 if (ufhp->ufid_ino < ROOTINO)
581 return (ESTALE);
582 return (ufs_check_export(mp, ufhp, nam, vpp, exflagsp, credanonp));
583 }
584
585 /*
586 * Vnode pointer to File handle
587 */
588 /* ARGSUSED */
589 int
590 lfs_vptofh(vp, fhp)
591 struct vnode *vp;
592 struct fid *fhp;
593 {
594 register struct inode *ip;
595 register struct ufid *ufhp;
596
597 ip = VTOI(vp);
598 ufhp = (struct ufid *)fhp;
599 ufhp->ufid_len = sizeof(struct ufid);
600 ufhp->ufid_ino = ip->i_number;
601 ufhp->ufid_gen = ip->i_gen;
602 return (0);
603 }
604