1 1.117 joe /* $NetBSD: mfs_vfsops.c,v 1.117 2025/02/16 18:38:59 joe Exp $ */ 2 1.2 cgd 3 1.1 mycroft /* 4 1.1 mycroft * Copyright (c) 1989, 1990, 1993, 1994 5 1.1 mycroft * The Regents of the University of California. All rights reserved. 6 1.1 mycroft * 7 1.1 mycroft * Redistribution and use in source and binary forms, with or without 8 1.1 mycroft * modification, are permitted provided that the following conditions 9 1.1 mycroft * are met: 10 1.1 mycroft * 1. Redistributions of source code must retain the above copyright 11 1.1 mycroft * notice, this list of conditions and the following disclaimer. 12 1.1 mycroft * 2. Redistributions in binary form must reproduce the above copyright 13 1.1 mycroft * notice, this list of conditions and the following disclaimer in the 14 1.1 mycroft * documentation and/or other materials provided with the distribution. 15 1.52 agc * 3. Neither the name of the University nor the names of its contributors 16 1.1 mycroft * may be used to endorse or promote products derived from this software 17 1.1 mycroft * without specific prior written permission. 18 1.1 mycroft * 19 1.1 mycroft * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 20 1.1 mycroft * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 21 1.1 mycroft * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 22 1.1 mycroft * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 23 1.1 mycroft * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 24 1.1 mycroft * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 25 1.1 mycroft * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 26 1.1 mycroft * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 27 1.1 mycroft * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 28 1.1 mycroft * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 29 1.1 mycroft * SUCH DAMAGE. 30 1.1 mycroft * 31 1.15 fvdl * @(#)mfs_vfsops.c 8.11 (Berkeley) 6/19/95 32 1.1 mycroft */ 33 1.36 lukem 34 1.36 lukem #include <sys/cdefs.h> 35 1.117 joe __KERNEL_RCSID(0, "$NetBSD: mfs_vfsops.c,v 1.117 2025/02/16 18:38:59 joe Exp $"); 36 1.17 jonathan 37 1.34 mrg #if defined(_KERNEL_OPT) 38 1.17 jonathan #include "opt_compat_netbsd.h" 39 1.17 jonathan #endif 40 1.1 mycroft 41 1.1 mycroft #include <sys/param.h> 42 1.1 mycroft #include <sys/systm.h> 43 1.54 atatat #include <sys/sysctl.h> 44 1.1 mycroft #include <sys/time.h> 45 1.1 mycroft #include <sys/kernel.h> 46 1.1 mycroft #include <sys/proc.h> 47 1.1 mycroft #include <sys/buf.h> 48 1.62 yamt #include <sys/bufq.h> 49 1.1 mycroft #include <sys/mount.h> 50 1.1 mycroft #include <sys/signalvar.h> 51 1.1 mycroft #include <sys/vnode.h> 52 1.91 ad #include <sys/kmem.h> 53 1.97 rumble #include <sys/module.h> 54 1.1 mycroft 55 1.88 dholland #include <miscfs/genfs/genfs.h> 56 1.87 pooka #include <miscfs/specfs/specdev.h> 57 1.33 thorpej 58 1.1 mycroft #include <ufs/ufs/quota.h> 59 1.1 mycroft #include <ufs/ufs/inode.h> 60 1.1 mycroft #include <ufs/ufs/ufsmount.h> 61 1.1 mycroft #include <ufs/ufs/ufs_extern.h> 62 1.1 mycroft 63 1.1 mycroft #include <ufs/ffs/fs.h> 64 1.1 mycroft #include <ufs/ffs/ffs_extern.h> 65 1.1 mycroft 66 1.1 mycroft #include <ufs/mfs/mfsnode.h> 67 1.1 mycroft #include <ufs/mfs/mfs_extern.h> 68 1.1 mycroft 69 1.99 ad MODULE(MODULE_CLASS_VFS, mfs, "ffs"); 70 1.97 rumble 71 1.91 ad kmutex_t mfs_lock; /* global lock */ 72 1.1 mycroft 73 1.102 pooka /* used for building internal dev_t, minor == 0 reserved for miniroot */ 74 1.109 hannken static devminor_t mfs_minor = 1; 75 1.91 ad static int mfs_initcnt; 76 1.1 mycroft 77 1.68 xtraeme extern int (**mfs_vnodeop_p)(void *); 78 1.44 thorpej 79 1.1 mycroft /* 80 1.1 mycroft * mfs vfs operations. 81 1.1 mycroft */ 82 1.14 thorpej 83 1.65 perry extern const struct vnodeopv_desc mfs_vnodeop_opv_desc; 84 1.14 thorpej 85 1.31 jdolecek const struct vnodeopv_desc * const mfs_vnodeopv_descs[] = { 86 1.14 thorpej &mfs_vnodeop_opv_desc, 87 1.14 thorpej NULL, 88 1.14 thorpej }; 89 1.14 thorpej 90 1.1 mycroft struct vfsops mfs_vfsops = { 91 1.106 hannken .vfs_name = MOUNT_MFS, 92 1.106 hannken .vfs_min_mount_data = sizeof (struct mfs_args), 93 1.106 hannken .vfs_mount = mfs_mount, 94 1.106 hannken .vfs_start = mfs_start, 95 1.106 hannken .vfs_unmount = ffs_unmount, 96 1.106 hannken .vfs_root = ufs_root, 97 1.106 hannken .vfs_quotactl = ufs_quotactl, 98 1.106 hannken .vfs_statvfs = mfs_statvfs, 99 1.106 hannken .vfs_sync = ffs_sync, 100 1.108 hannken .vfs_vget = ufs_vget, 101 1.108 hannken .vfs_loadvnode = ffs_loadvnode, 102 1.110 hannken .vfs_newvnode = ffs_newvnode, 103 1.106 hannken .vfs_fhtovp = ffs_fhtovp, 104 1.106 hannken .vfs_vptofh = ffs_vptofh, 105 1.106 hannken .vfs_init = mfs_init, 106 1.106 hannken .vfs_reinit = mfs_reinit, 107 1.106 hannken .vfs_done = mfs_done, 108 1.106 hannken .vfs_snapshot = (void *)eopnotsupp, 109 1.106 hannken .vfs_extattrctl = vfs_stdextattrctl, 110 1.111 hannken .vfs_suspendctl = genfs_suspendctl, 111 1.106 hannken .vfs_renamelock_enter = genfs_renamelock_enter, 112 1.106 hannken .vfs_renamelock_exit = genfs_renamelock_exit, 113 1.106 hannken .vfs_fsync = (void *)eopnotsupp, 114 1.106 hannken .vfs_opv_descs = mfs_vnodeopv_descs 115 1.1 mycroft }; 116 1.97 rumble 117 1.114 pgoyette SYSCTL_SETUP(mfs_sysctl_setup, "mfs sysctl") 118 1.114 pgoyette { 119 1.114 pgoyette 120 1.114 pgoyette sysctl_createv(clog, 0, NULL, NULL, 121 1.114 pgoyette CTLFLAG_PERMANENT|CTLFLAG_ALIAS, 122 1.114 pgoyette CTLTYPE_NODE, "mfs", 123 1.114 pgoyette SYSCTL_DESCR("Memory based file system"), 124 1.114 pgoyette NULL, 1, NULL, 0, 125 1.114 pgoyette CTL_VFS, 3, CTL_EOL); 126 1.114 pgoyette /* 127 1.114 pgoyette * XXX the "1" and the "3" above could be dynamic, thereby 128 1.114 pgoyette * eliminating one more instance of the "number to vfs" 129 1.114 pgoyette * mapping problem, but they are in order as taken from 130 1.114 pgoyette * sys/mount.h 131 1.114 pgoyette */ 132 1.114 pgoyette } 133 1.114 pgoyette 134 1.97 rumble static int 135 1.97 rumble mfs_modcmd(modcmd_t cmd, void *arg) 136 1.97 rumble { 137 1.98 rumble int error; 138 1.97 rumble 139 1.97 rumble switch (cmd) { 140 1.97 rumble case MODULE_CMD_INIT: 141 1.98 rumble error = vfs_attach(&mfs_vfsops); 142 1.98 rumble break; 143 1.97 rumble case MODULE_CMD_FINI: 144 1.98 rumble error = vfs_detach(&mfs_vfsops); 145 1.98 rumble break; 146 1.97 rumble default: 147 1.98 rumble error = ENOTTY; 148 1.98 rumble break; 149 1.97 rumble } 150 1.54 atatat 151 1.98 rumble return (error); 152 1.54 atatat } 153 1.1 mycroft 154 1.65 perry /* 155 1.15 fvdl * Memory based filesystem initialization. 156 1.65 perry */ 157 1.15 fvdl void 158 1.68 xtraeme mfs_init(void) 159 1.15 fvdl { 160 1.79 pooka 161 1.91 ad if (mfs_initcnt++ == 0) { 162 1.91 ad mutex_init(&mfs_lock, MUTEX_DEFAULT, IPL_NONE); 163 1.91 ad ffs_init(); 164 1.91 ad } 165 1.35 chs } 166 1.35 chs 167 1.35 chs void 168 1.68 xtraeme mfs_reinit(void) 169 1.35 chs { 170 1.91 ad 171 1.35 chs ffs_reinit(); 172 1.15 fvdl } 173 1.15 fvdl 174 1.23 jdolecek void 175 1.68 xtraeme mfs_done(void) 176 1.23 jdolecek { 177 1.91 ad 178 1.91 ad if (--mfs_initcnt == 0) { 179 1.91 ad ffs_done(); 180 1.91 ad mutex_destroy(&mfs_lock); 181 1.91 ad } 182 1.23 jdolecek } 183 1.15 fvdl 184 1.1 mycroft /* 185 1.1 mycroft * Called by main() when mfs is going to be mounted as root. 186 1.1 mycroft */ 187 1.1 mycroft 188 1.10 christos int 189 1.68 xtraeme mfs_mountroot(void) 190 1.1 mycroft { 191 1.15 fvdl struct fs *fs; 192 1.15 fvdl struct mount *mp; 193 1.71 christos struct lwp *l = curlwp; /* XXX */ 194 1.1 mycroft struct ufsmount *ump; 195 1.1 mycroft struct mfsnode *mfsp; 196 1.15 fvdl int error = 0; 197 1.1 mycroft 198 1.21 wrstuden if ((error = vfs_rootmountalloc(MOUNT_MFS, "mfs_root", &mp))) { 199 1.21 wrstuden vrele(rootvp); 200 1.15 fvdl return (error); 201 1.21 wrstuden } 202 1.1 mycroft 203 1.91 ad mfsp = kmem_alloc(sizeof(*mfsp), KM_SLEEP); 204 1.1 mycroft rootvp->v_data = mfsp; 205 1.1 mycroft rootvp->v_op = mfs_vnodeop_p; 206 1.1 mycroft rootvp->v_tag = VT_MFS; 207 1.1 mycroft mfsp->mfs_baseoff = mfs_rootbase; 208 1.1 mycroft mfsp->mfs_size = mfs_rootsize; 209 1.1 mycroft mfsp->mfs_vnode = rootvp; 210 1.26 thorpej mfsp->mfs_proc = NULL; /* indicate kernel space */ 211 1.39 hannken mfsp->mfs_shutdown = 0; 212 1.91 ad cv_init(&mfsp->mfs_cv, "mfs"); 213 1.91 ad mfsp->mfs_refcnt = 1; 214 1.70 yamt bufq_alloc(&mfsp->mfs_buflist, "fcfs", 0); 215 1.71 christos if ((error = ffs_mountfs(rootvp, mp, l)) != 0) { 216 1.113 hannken vfs_unbusy(mp); 217 1.70 yamt bufq_free(mfsp->mfs_buflist); 218 1.112 hannken vfs_rele(mp); 219 1.91 ad kmem_free(mfsp, sizeof(*mfsp)); 220 1.1 mycroft return (error); 221 1.65 perry } 222 1.104 christos mountlist_append(mp); 223 1.1 mycroft mp->mnt_vnodecovered = NULLVP; 224 1.1 mycroft ump = VFSTOUFS(mp); 225 1.1 mycroft fs = ump->um_fs; 226 1.15 fvdl (void) copystr(mp->mnt_stat.f_mntonname, fs->fs_fsmnt, MNAMELEN - 1, 0); 227 1.85 pooka (void)ffs_statvfs(mp, &mp->mnt_stat); 228 1.113 hannken vfs_unbusy(mp); 229 1.1 mycroft return (0); 230 1.1 mycroft } 231 1.1 mycroft 232 1.1 mycroft /* 233 1.1 mycroft * VFS Operations. 234 1.1 mycroft * 235 1.1 mycroft * mount system call 236 1.1 mycroft */ 237 1.1 mycroft /* ARGSUSED */ 238 1.1 mycroft int 239 1.85 pooka mfs_mount(struct mount *mp, const char *path, void *data, size_t *data_len) 240 1.1 mycroft { 241 1.85 pooka struct lwp *l = curlwp; 242 1.1 mycroft struct vnode *devvp; 243 1.80 dsl struct mfs_args *args = data; 244 1.1 mycroft struct ufsmount *ump; 245 1.25 augustss struct fs *fs; 246 1.25 augustss struct mfsnode *mfsp; 247 1.71 christos struct proc *p; 248 1.109 hannken devminor_t minor; 249 1.80 dsl int flags, error = 0; 250 1.80 dsl 251 1.107 maxv if (args == NULL) 252 1.107 maxv return EINVAL; 253 1.80 dsl if (*data_len < sizeof *args) 254 1.80 dsl return EINVAL; 255 1.37 chs 256 1.71 christos p = l->l_proc; 257 1.41 christos if (mp->mnt_flag & MNT_GETARGS) { 258 1.41 christos struct vnode *vp; 259 1.41 christos 260 1.41 christos ump = VFSTOUFS(mp); 261 1.41 christos if (ump == NULL) 262 1.41 christos return EIO; 263 1.41 christos 264 1.41 christos vp = ump->um_devvp; 265 1.41 christos if (vp == NULL) 266 1.41 christos return EIO; 267 1.41 christos 268 1.41 christos mfsp = VTOMFS(vp); 269 1.41 christos if (mfsp == NULL) 270 1.41 christos return EIO; 271 1.41 christos 272 1.80 dsl args->fspec = NULL; 273 1.80 dsl args->base = mfsp->mfs_baseoff; 274 1.80 dsl args->size = mfsp->mfs_size; 275 1.80 dsl *data_len = sizeof *args; 276 1.80 dsl return 0; 277 1.41 christos } 278 1.37 chs /* 279 1.37 chs * XXX turn off async to avoid hangs when writing lots of data. 280 1.37 chs * the problem is that MFS needs to allocate pages to clean pages, 281 1.37 chs * so if we wait until the last minute to clean pages then there 282 1.37 chs * may not be any pages available to do the cleaning. 283 1.42 chs * ... and since the default partially-synchronous mode turns out 284 1.42 chs * to not be sufficient under heavy load, make it full synchronous. 285 1.37 chs */ 286 1.37 chs mp->mnt_flag &= ~MNT_ASYNC; 287 1.42 chs mp->mnt_flag |= MNT_SYNCHRONOUS; 288 1.1 mycroft 289 1.1 mycroft /* 290 1.1 mycroft * If updating, check whether changing from read-only to 291 1.1 mycroft * read/write; if there is no device name, that's all we do. 292 1.1 mycroft */ 293 1.1 mycroft if (mp->mnt_flag & MNT_UPDATE) { 294 1.1 mycroft ump = VFSTOUFS(mp); 295 1.1 mycroft fs = ump->um_fs; 296 1.1 mycroft if (fs->fs_ronly == 0 && (mp->mnt_flag & MNT_RDONLY)) { 297 1.1 mycroft flags = WRITECLOSE; 298 1.1 mycroft if (mp->mnt_flag & MNT_FORCE) 299 1.1 mycroft flags |= FORCECLOSE; 300 1.71 christos error = ffs_flushfiles(mp, flags, l); 301 1.1 mycroft if (error) 302 1.1 mycroft return (error); 303 1.1 mycroft } 304 1.53 dbj if (fs->fs_ronly && (mp->mnt_iflag & IMNT_WANTRDWR)) 305 1.1 mycroft fs->fs_ronly = 0; 306 1.80 dsl if (args->fspec == NULL) 307 1.69 jmmv return EINVAL; 308 1.1 mycroft return (0); 309 1.1 mycroft } 310 1.109 hannken mutex_enter(&mfs_lock); 311 1.109 hannken minor = mfs_minor++; 312 1.109 hannken mutex_exit(&mfs_lock); 313 1.109 hannken error = bdevvp(makedev(255, minor), &devvp); 314 1.1 mycroft if (error) 315 1.1 mycroft return (error); 316 1.91 ad mfsp = kmem_alloc(sizeof(*mfsp), KM_SLEEP); 317 1.109 hannken /* 318 1.109 hannken * Changing v_op and v_data here is safe as we are 319 1.109 hannken * the exclusive owner of this device node. 320 1.109 hannken */ 321 1.109 hannken KASSERT(devvp->v_op == spec_vnodeop_p); 322 1.109 hannken KASSERT(devvp->v_data == NULL); 323 1.109 hannken devvp->v_op = mfs_vnodeop_p; 324 1.1 mycroft devvp->v_data = mfsp; 325 1.80 dsl mfsp->mfs_baseoff = args->base; 326 1.80 dsl mfsp->mfs_size = args->size; 327 1.1 mycroft mfsp->mfs_vnode = devvp; 328 1.26 thorpej mfsp->mfs_proc = p; 329 1.39 hannken mfsp->mfs_shutdown = 0; 330 1.90 ad cv_init(&mfsp->mfs_cv, "mfsidl"); 331 1.91 ad mfsp->mfs_refcnt = 1; 332 1.70 yamt bufq_alloc(&mfsp->mfs_buflist, "fcfs", 0); 333 1.71 christos if ((error = ffs_mountfs(devvp, mp, l)) != 0) { 334 1.39 hannken mfsp->mfs_shutdown = 1; 335 1.1 mycroft vrele(devvp); 336 1.1 mycroft return (error); 337 1.1 mycroft } 338 1.1 mycroft ump = VFSTOUFS(mp); 339 1.1 mycroft fs = ump->um_fs; 340 1.80 dsl error = set_statvfs_info(path, UIO_USERSPACE, args->fspec, 341 1.81 pooka UIO_USERSPACE, mp->mnt_op->vfs_name, mp, l); 342 1.58 christos if (error) 343 1.58 christos return error; 344 1.58 christos (void)strncpy(fs->fs_fsmnt, mp->mnt_stat.f_mntonname, 345 1.58 christos sizeof(fs->fs_fsmnt)); 346 1.58 christos fs->fs_fsmnt[sizeof(fs->fs_fsmnt) - 1] = '\0'; 347 1.57 enami /* XXX: cleanup on error */ 348 1.58 christos return 0; 349 1.1 mycroft } 350 1.1 mycroft 351 1.1 mycroft /* 352 1.1 mycroft * Used to grab the process and keep it in the kernel to service 353 1.1 mycroft * memory filesystem I/O requests. 354 1.1 mycroft * 355 1.28 thorpej * Loop servicing I/O requests. 356 1.28 thorpej * Copy the requested data into or out of the memory filesystem 357 1.28 thorpej * address space. 358 1.1 mycroft */ 359 1.1 mycroft /* ARGSUSED */ 360 1.1 mycroft int 361 1.85 pooka mfs_start(struct mount *mp, int flags) 362 1.1 mycroft { 363 1.91 ad struct vnode *vp; 364 1.91 ad struct mfsnode *mfsp; 365 1.77 ad struct proc *p; 366 1.28 thorpej struct buf *bp; 367 1.78 christos void *base; 368 1.91 ad int sleepreturn = 0, refcnt, error; 369 1.77 ad ksiginfoq_t kq; 370 1.1 mycroft 371 1.91 ad /* 372 1.91 ad * Ensure that file system is still mounted when getting mfsnode. 373 1.91 ad * Add a reference to the mfsnode to prevent it disappearing in 374 1.91 ad * this routine. 375 1.91 ad */ 376 1.113 hannken if ((error = vfs_busy(mp)) != 0) 377 1.91 ad return error; 378 1.91 ad vp = VFSTOUFS(mp)->um_devvp; 379 1.91 ad mfsp = VTOMFS(vp); 380 1.91 ad mutex_enter(&mfs_lock); 381 1.91 ad mfsp->mfs_refcnt++; 382 1.91 ad mutex_exit(&mfs_lock); 383 1.113 hannken vfs_unbusy(mp); 384 1.91 ad 385 1.28 thorpej base = mfsp->mfs_baseoff; 386 1.91 ad mutex_enter(&mfs_lock); 387 1.39 hannken while (mfsp->mfs_shutdown != 1) { 388 1.101 yamt while ((bp = bufq_get(mfsp->mfs_buflist)) != NULL) { 389 1.91 ad mutex_exit(&mfs_lock); 390 1.30 simonb mfs_doio(bp, base); 391 1.91 ad mutex_enter(&mfs_lock); 392 1.30 simonb } 393 1.1 mycroft /* 394 1.1 mycroft * If a non-ignored signal is received, try to unmount. 395 1.15 fvdl * If that fails, or the filesystem is already in the 396 1.15 fvdl * process of being unmounted, clear the signal (it has been 397 1.15 fvdl * "processed"), otherwise we will loop here, as tsleep 398 1.15 fvdl * will always return EINTR/ERESTART. 399 1.1 mycroft */ 400 1.15 fvdl if (sleepreturn != 0) { 401 1.91 ad mutex_exit(&mfs_lock); 402 1.96 ad if (dounmount(mp, 0, curlwp) != 0) { 403 1.91 ad p = curproc; 404 1.77 ad ksiginfo_queue_init(&kq); 405 1.92 ad mutex_enter(p->p_lock); 406 1.77 ad sigclearall(p, NULL, &kq); 407 1.92 ad mutex_exit(p->p_lock); 408 1.77 ad ksiginfo_queue_drain(&kq); 409 1.77 ad } 410 1.15 fvdl sleepreturn = 0; 411 1.91 ad mutex_enter(&mfs_lock); 412 1.12 fvdl continue; 413 1.9 mycroft } 414 1.28 thorpej 415 1.91 ad sleepreturn = cv_wait_sig(&mfsp->mfs_cv, &mfs_lock); 416 1.1 mycroft } 417 1.101 yamt KASSERT(bufq_peek(mfsp->mfs_buflist) == NULL); 418 1.91 ad refcnt = --mfsp->mfs_refcnt; 419 1.91 ad mutex_exit(&mfs_lock); 420 1.91 ad if (refcnt == 0) { 421 1.91 ad bufq_free(mfsp->mfs_buflist); 422 1.91 ad cv_destroy(&mfsp->mfs_cv); 423 1.91 ad kmem_free(mfsp, sizeof(*mfsp)); 424 1.91 ad } 425 1.15 fvdl return (sleepreturn); 426 1.1 mycroft } 427 1.1 mycroft 428 1.1 mycroft /* 429 1.1 mycroft * Get file system statistics. 430 1.1 mycroft */ 431 1.10 christos int 432 1.85 pooka mfs_statvfs(struct mount *mp, struct statvfs *sbp) 433 1.1 mycroft { 434 1.1 mycroft int error; 435 1.1 mycroft 436 1.85 pooka error = ffs_statvfs(mp, sbp); 437 1.58 christos if (error) 438 1.58 christos return error; 439 1.58 christos (void)strncpy(sbp->f_fstypename, mp->mnt_op->vfs_name, 440 1.58 christos sizeof(sbp->f_fstypename)); 441 1.58 christos sbp->f_fstypename[sizeof(sbp->f_fstypename) - 1] = '\0'; 442 1.58 christos return 0; 443 1.1 mycroft } 444