rumpfs.c revision 1.30 1 1.30 pooka /* $NetBSD: rumpfs.c,v 1.30 2009/11/26 20:58:51 pooka Exp $ */
2 1.1 pooka
3 1.1 pooka /*
4 1.30 pooka * Copyright (c) 2009 Antti Kantee. All Rights Reserved.
5 1.1 pooka *
6 1.1 pooka * Redistribution and use in source and binary forms, with or without
7 1.1 pooka * modification, are permitted provided that the following conditions
8 1.1 pooka * are met:
9 1.1 pooka * 1. Redistributions of source code must retain the above copyright
10 1.1 pooka * notice, this list of conditions and the following disclaimer.
11 1.1 pooka * 2. Redistributions in binary form must reproduce the above copyright
12 1.1 pooka * notice, this list of conditions and the following disclaimer in the
13 1.1 pooka * documentation and/or other materials provided with the distribution.
14 1.1 pooka *
15 1.1 pooka * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS
16 1.1 pooka * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
17 1.1 pooka * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
18 1.1 pooka * DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
19 1.1 pooka * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
20 1.1 pooka * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
21 1.1 pooka * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
22 1.1 pooka * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
23 1.1 pooka * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
24 1.1 pooka * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
25 1.1 pooka * SUCH DAMAGE.
26 1.1 pooka */
27 1.1 pooka
28 1.3 pooka #include <sys/cdefs.h>
29 1.30 pooka __KERNEL_RCSID(0, "$NetBSD: rumpfs.c,v 1.30 2009/11/26 20:58:51 pooka Exp $");
30 1.3 pooka
31 1.1 pooka #include <sys/param.h>
32 1.24 pooka #include <sys/atomic.h>
33 1.24 pooka #include <sys/filedesc.h>
34 1.1 pooka #include <sys/errno.h>
35 1.24 pooka #include <sys/fcntl.h>
36 1.1 pooka #include <sys/kauth.h>
37 1.24 pooka #include <sys/malloc.h>
38 1.30 pooka #include <sys/module.h>
39 1.24 pooka #include <sys/mount.h>
40 1.24 pooka #include <sys/namei.h>
41 1.1 pooka #include <sys/lock.h>
42 1.1 pooka #include <sys/lockf.h>
43 1.24 pooka #include <sys/queue.h>
44 1.1 pooka #include <sys/stat.h>
45 1.1 pooka #include <sys/syscallargs.h>
46 1.24 pooka #include <sys/vnode.h>
47 1.1 pooka
48 1.1 pooka #include <miscfs/fifofs/fifo.h>
49 1.1 pooka #include <miscfs/specfs/specdev.h>
50 1.1 pooka #include <miscfs/genfs/genfs.h>
51 1.1 pooka
52 1.1 pooka #include <rump/rumpuser.h>
53 1.1 pooka
54 1.1 pooka #include "rump_private.h"
55 1.1 pooka #include "rump_vfs_private.h"
56 1.1 pooka
/*
 * Forward declarations for the vnode operations implemented in this
 * file.  Every one of them receives its argument structure through a
 * single void pointer.
 */

/* name resolution and attributes */
static int	rump_vop_lookup(void *);
static int	rump_vop_getattr(void *);

/* node creation */
static int	rump_vop_create(void *);
static int	rump_vop_mkdir(void *);
static int	rump_vop_mknod(void *);

/* file I/O */
static int	rump_vop_open(void *);
static int	rump_vop_read(void *);
static int	rump_vop_write(void *);

/* vnode lifecycle */
static int	rump_vop_inactive(void *);
static int	rump_vop_reclaim(void *);

/* generic helpers */
static int	rump_vop_success(void *);
static int	rump_vop_spec(void *);
69 1.1 pooka
70 1.1 pooka int (**fifo_vnodeop_p)(void *);
71 1.1 pooka const struct vnodeopv_entry_desc fifo_vnodeop_entries[] = {
72 1.1 pooka { &vop_default_desc, vn_default_error },
73 1.1 pooka { NULL, NULL }
74 1.1 pooka };
75 1.1 pooka const struct vnodeopv_desc fifo_vnodeop_opv_desc =
76 1.1 pooka { &fifo_vnodeop_p, fifo_vnodeop_entries };
77 1.1 pooka
78 1.1 pooka int (**rump_vnodeop_p)(void *);
79 1.1 pooka const struct vnodeopv_entry_desc rump_vnodeop_entries[] = {
80 1.1 pooka { &vop_default_desc, vn_default_error },
81 1.1 pooka { &vop_lookup_desc, rump_vop_lookup },
82 1.9 pooka { &vop_getattr_desc, rump_vop_getattr },
83 1.14 pooka { &vop_mkdir_desc, rump_vop_mkdir },
84 1.19 pooka { &vop_mknod_desc, rump_vop_mknod },
85 1.26 pooka { &vop_create_desc, rump_vop_create },
86 1.19 pooka { &vop_access_desc, rump_vop_success },
87 1.24 pooka { &vop_read_desc, rump_vop_read },
88 1.24 pooka { &vop_write_desc, rump_vop_write },
89 1.24 pooka { &vop_open_desc, rump_vop_open },
90 1.13 pooka { &vop_putpages_desc, genfs_null_putpages },
91 1.9 pooka { &vop_fsync_desc, rump_vop_success },
92 1.1 pooka { &vop_lock_desc, genfs_lock },
93 1.1 pooka { &vop_unlock_desc, genfs_unlock },
94 1.14 pooka { &vop_inactive_desc, rump_vop_inactive },
95 1.12 pooka { &vop_reclaim_desc, rump_vop_reclaim },
96 1.1 pooka { NULL, NULL }
97 1.1 pooka };
98 1.1 pooka const struct vnodeopv_desc rump_vnodeop_opv_desc =
99 1.1 pooka { &rump_vnodeop_p, rump_vnodeop_entries };
100 1.19 pooka
101 1.19 pooka int (**rump_specop_p)(void *);
102 1.19 pooka const struct vnodeopv_entry_desc rump_specop_entries[] = {
103 1.19 pooka { &vop_default_desc, rump_vop_spec },
104 1.19 pooka { NULL, NULL }
105 1.19 pooka };
106 1.19 pooka const struct vnodeopv_desc rump_specop_opv_desc =
107 1.19 pooka { &rump_specop_p, rump_specop_entries };
108 1.19 pooka
109 1.1 pooka const struct vnodeopv_desc * const rump_opv_descs[] = {
110 1.1 pooka &rump_vnodeop_opv_desc,
111 1.19 pooka &rump_specop_opv_desc,
112 1.1 pooka NULL
113 1.1 pooka };
114 1.1 pooka
/*
 * One directory entry: binds a name to a node.  Entries are chained on
 * the rn_dir list of the directory node that contains them.
 */
struct rumpfs_dent {
	char			*rd_name;	/* NUL-terminated entry name */
	struct rumpfs_node	*rd_node;	/* node the name refers to */

	LIST_ENTRY(rumpfs_dent)	rd_entries;	/* linkage in parent's rn_dir */
};
121 1.14 pooka
122 1.14 pooka struct rumpfs_node {
123 1.14 pooka struct vattr rn_va;
124 1.14 pooka struct vnode *rn_vp;
125 1.14 pooka
126 1.24 pooka union {
127 1.24 pooka struct {
128 1.24 pooka char *hostpath; /* VREG */
129 1.24 pooka int readfd;
130 1.24 pooka int writefd;
131 1.27 pooka uint64_t offset;
132 1.24 pooka } reg;
133 1.24 pooka LIST_HEAD(, rumpfs_dent) dir; /* VDIR */
134 1.24 pooka } rn_u;
135 1.14 pooka };
136 1.24 pooka #define rn_hostpath rn_u.reg.hostpath
137 1.24 pooka #define rn_readfd rn_u.reg.readfd
138 1.24 pooka #define rn_writefd rn_u.reg.writefd
139 1.27 pooka #define rn_offset rn_u.reg.offset
140 1.24 pooka #define rn_dir rn_u.dir
141 1.14 pooka
/* Per-mount private data, hung off mp->mnt_data. */
struct rumpfs_mount {
	struct vnode	*rfsmp_rvp;	/* root vnode of this mount */
};
145 1.30 pooka
/* Allocate a node of the given type; defined with the rest of rumpfs below. */
static struct rumpfs_node *makeprivate(enum vtype vt, dev_t rdev, off_t size);
147 1.21 pooka
148 1.21 pooka /*
149 1.21 pooka * Extra Terrestrial stuff. We map a given key (pathname) to a file on
150 1.21 pooka * the host FS. ET phones home only from the root node of rumpfs.
151 1.21 pooka *
152 1.21 pooka * When an etfs node is removed, a vnode potentially behind it is not
153 1.21 pooka * immediately recycled.
154 1.21 pooka */
155 1.21 pooka
156 1.21 pooka struct etfs {
157 1.21 pooka char et_key[MAXPATHLEN];
158 1.24 pooka size_t et_keylen;
159 1.24 pooka
160 1.21 pooka LIST_ENTRY(etfs) et_entries;
161 1.21 pooka
162 1.21 pooka struct rumpfs_node *et_rn;
163 1.21 pooka };
164 1.21 pooka static kmutex_t etfs_lock;
165 1.21 pooka static LIST_HEAD(, etfs) etfs_list = LIST_HEAD_INITIALIZER(etfs_list);
166 1.21 pooka
167 1.21 pooka static enum vtype
168 1.21 pooka ettype_to_vtype(enum rump_etfs_type et)
169 1.21 pooka {
170 1.21 pooka enum vtype vt;
171 1.21 pooka
172 1.21 pooka switch (et) {
173 1.21 pooka case RUMP_ETFS_REG:
174 1.21 pooka vt = VREG;
175 1.21 pooka break;
176 1.21 pooka case RUMP_ETFS_BLK:
177 1.21 pooka vt = VBLK;
178 1.21 pooka break;
179 1.21 pooka case RUMP_ETFS_CHR:
180 1.21 pooka vt = VCHR;
181 1.21 pooka break;
182 1.21 pooka default:
183 1.21 pooka panic("invalid et type: %d", et);
184 1.21 pooka }
185 1.21 pooka
186 1.21 pooka return vt;
187 1.21 pooka }
188 1.21 pooka
189 1.21 pooka static bool
190 1.21 pooka etfs_find(const char *key, struct rumpfs_node **rnp)
191 1.21 pooka {
192 1.21 pooka struct etfs *et;
193 1.24 pooka size_t keylen = strlen(key);
194 1.21 pooka bool rv = false;
195 1.21 pooka
196 1.21 pooka KASSERT(mutex_owned(&etfs_lock));
197 1.21 pooka
198 1.21 pooka LIST_FOREACH(et, &etfs_list, et_entries) {
199 1.24 pooka if (keylen == et->et_keylen && strcmp(key, et->et_key) == 0) {
200 1.21 pooka *rnp = et->et_rn;
201 1.21 pooka rv = true;
202 1.21 pooka break;
203 1.21 pooka }
204 1.21 pooka }
205 1.21 pooka
206 1.21 pooka return rv;
207 1.21 pooka }
208 1.21 pooka
209 1.25 pooka static int
210 1.25 pooka doregister(const char *key, const char *hostpath,
211 1.25 pooka enum rump_etfs_type ftype, uint64_t begin, uint64_t size)
212 1.21 pooka {
213 1.21 pooka struct etfs *et;
214 1.27 pooka struct rumpfs_node *rn_dummy, *rn;
215 1.21 pooka uint64_t fsize;
216 1.24 pooka dev_t rdev = NODEV;
217 1.21 pooka devminor_t dmin;
218 1.21 pooka int hft, error;
219 1.21 pooka
220 1.21 pooka if (rumpuser_getfileinfo(hostpath, &fsize, &hft, &error))
221 1.21 pooka return error;
222 1.21 pooka
223 1.25 pooka /* check that we give sensible arguments */
224 1.25 pooka if (begin > fsize)
225 1.25 pooka return EINVAL;
226 1.25 pooka if (size == RUMP_ETFS_SIZE_ENDOFF)
227 1.25 pooka size = fsize - begin;
228 1.25 pooka if (begin + size > fsize)
229 1.25 pooka return EINVAL;
230 1.25 pooka
231 1.24 pooka if (ftype == RUMP_ETFS_BLK || ftype == RUMP_ETFS_CHR) {
232 1.25 pooka error = rumpblk_register(hostpath, &dmin, begin, size);
233 1.24 pooka if (error != 0) {
234 1.24 pooka return error;
235 1.24 pooka }
236 1.24 pooka rdev = makedev(RUMPBLK, dmin);
237 1.21 pooka }
238 1.21 pooka
239 1.21 pooka et = kmem_alloc(sizeof(*et), KM_SLEEP);
240 1.21 pooka strcpy(et->et_key, key);
241 1.24 pooka et->et_keylen = strlen(et->et_key);
242 1.27 pooka et->et_rn = rn = makeprivate(ettype_to_vtype(ftype), rdev, size);
243 1.27 pooka if (ftype == RUMP_ETFS_REG) {
244 1.27 pooka size_t len = strlen(hostpath)+1;
245 1.27 pooka
246 1.27 pooka rn->rn_hostpath = malloc(len, M_TEMP, M_WAITOK | M_ZERO);
247 1.27 pooka memcpy(rn->rn_hostpath, hostpath, len);
248 1.27 pooka rn->rn_offset = begin;
249 1.27 pooka }
250 1.21 pooka
251 1.21 pooka mutex_enter(&etfs_lock);
252 1.21 pooka if (etfs_find(key, &rn_dummy)) {
253 1.21 pooka mutex_exit(&etfs_lock);
254 1.21 pooka kmem_free(et, sizeof(*et));
255 1.21 pooka /* XXX: rumpblk_deregister(hostpath); */
256 1.21 pooka return EEXIST;
257 1.21 pooka }
258 1.21 pooka LIST_INSERT_HEAD(&etfs_list, et, et_entries);
259 1.21 pooka mutex_exit(&etfs_lock);
260 1.21 pooka
261 1.21 pooka return 0;
262 1.21 pooka }
263 1.21 pooka
264 1.21 pooka int
265 1.29 pooka rump_etfs_register(const char *key, const char *hostpath,
266 1.25 pooka enum rump_etfs_type ftype)
267 1.25 pooka {
268 1.25 pooka
269 1.25 pooka return doregister(key, hostpath, ftype, 0, RUMP_ETFS_SIZE_ENDOFF);
270 1.25 pooka }
271 1.25 pooka
272 1.25 pooka int
273 1.29 pooka rump_etfs_register_withsize(const char *key, const char *hostpath,
274 1.25 pooka enum rump_etfs_type ftype, uint64_t begin, uint64_t size)
275 1.25 pooka {
276 1.25 pooka
277 1.25 pooka /*
278 1.25 pooka * Check that we're mapping at block offsets. I guess this
279 1.25 pooka * is not technically necessary except for BLK/CHR backends
280 1.25 pooka * (i.e. what getfileinfo() returns, not ftype) and can be
281 1.25 pooka * removed later if there are problems.
282 1.25 pooka */
283 1.25 pooka if ((begin & (DEV_BSIZE-1)) != 0)
284 1.25 pooka return EINVAL;
285 1.25 pooka if (size != RUMP_ETFS_SIZE_ENDOFF && (size & (DEV_BSIZE-1)) != 0)
286 1.25 pooka return EINVAL;
287 1.25 pooka
288 1.25 pooka return doregister(key, hostpath, ftype, begin, size);
289 1.25 pooka }
290 1.25 pooka
291 1.25 pooka int
292 1.29 pooka rump_etfs_remove(const char *key)
293 1.21 pooka {
294 1.21 pooka struct etfs *et;
295 1.24 pooka size_t keylen = strlen(key);
296 1.21 pooka
297 1.21 pooka mutex_enter(&etfs_lock);
298 1.21 pooka LIST_FOREACH(et, &etfs_list, et_entries) {
299 1.24 pooka if (keylen == et->et_keylen && strcmp(et->et_key, key) == 0) {
300 1.21 pooka LIST_REMOVE(et, et_entries);
301 1.21 pooka kmem_free(et, sizeof(*et));
302 1.21 pooka break;
303 1.21 pooka }
304 1.21 pooka }
305 1.21 pooka mutex_exit(&etfs_lock);
306 1.21 pooka
307 1.21 pooka if (!et)
308 1.21 pooka return ENOENT;
309 1.21 pooka return 0;
310 1.21 pooka }
311 1.21 pooka
312 1.21 pooka /*
313 1.21 pooka * rumpfs
314 1.21 pooka */
315 1.21 pooka
316 1.21 pooka static int lastino = 1;
317 1.21 pooka static kmutex_t reclock;
318 1.21 pooka
319 1.14 pooka static struct rumpfs_node *
320 1.27 pooka makeprivate(enum vtype vt, dev_t rdev, off_t size)
321 1.9 pooka {
322 1.14 pooka struct rumpfs_node *rn;
323 1.9 pooka struct vattr *va;
324 1.9 pooka struct timespec ts;
325 1.9 pooka
326 1.23 pooka rn = kmem_zalloc(sizeof(*rn), KM_SLEEP);
327 1.24 pooka
328 1.24 pooka switch (vt) {
329 1.24 pooka case VDIR:
330 1.24 pooka LIST_INIT(&rn->rn_dir);
331 1.24 pooka break;
332 1.24 pooka case VREG:
333 1.24 pooka rn->rn_readfd = -1;
334 1.24 pooka rn->rn_writefd = -1;
335 1.24 pooka break;
336 1.24 pooka default:
337 1.24 pooka break;
338 1.24 pooka }
339 1.24 pooka
340 1.9 pooka nanotime(&ts);
341 1.9 pooka
342 1.14 pooka va = &rn->rn_va;
343 1.9 pooka va->va_type = vt;
344 1.9 pooka va->va_mode = 0755;
345 1.14 pooka if (vt == VDIR)
346 1.14 pooka va->va_nlink = 2;
347 1.14 pooka else
348 1.14 pooka va->va_nlink = 1;
349 1.9 pooka va->va_uid = 0;
350 1.9 pooka va->va_gid = 0;
351 1.9 pooka va->va_fsid =
352 1.9 pooka va->va_fileid = atomic_inc_uint_nv(&lastino);
353 1.19 pooka va->va_size = size;
354 1.9 pooka va->va_blocksize = 512;
355 1.9 pooka va->va_atime = ts;
356 1.9 pooka va->va_mtime = ts;
357 1.9 pooka va->va_ctime = ts;
358 1.9 pooka va->va_birthtime = ts;
359 1.9 pooka va->va_gen = 0;
360 1.9 pooka va->va_flags = 0;
361 1.19 pooka va->va_rdev = rdev;
362 1.9 pooka va->va_bytes = 512;
363 1.9 pooka va->va_filerev = 0;
364 1.9 pooka va->va_vaflags = 0;
365 1.9 pooka
366 1.14 pooka return rn;
367 1.9 pooka }
368 1.1 pooka
369 1.6 pooka static int
370 1.30 pooka makevnode(struct mount *mp, struct rumpfs_node *rn, struct vnode **vpp)
371 1.1 pooka {
372 1.1 pooka struct vnode *vp;
373 1.12 pooka int (**vpops)(void *);
374 1.21 pooka struct vattr *va = &rn->rn_va;
375 1.6 pooka int rv;
376 1.1 pooka
377 1.21 pooka KASSERT(mutex_owned(&reclock));
378 1.21 pooka
379 1.21 pooka if (va->va_type == VCHR || va->va_type == VBLK) {
380 1.19 pooka vpops = rump_specop_p;
381 1.12 pooka } else {
382 1.12 pooka vpops = rump_vnodeop_p;
383 1.12 pooka }
384 1.24 pooka if (vpops != rump_specop_p && va->va_type != VDIR
385 1.26 pooka && !(va->va_type == VREG && rn->rn_hostpath != NULL)
386 1.26 pooka && va->va_type != VSOCK)
387 1.21 pooka return EOPNOTSUPP;
388 1.12 pooka
389 1.30 pooka rv = getnewvnode(VT_RUMP, mp, vpops, &vp);
390 1.12 pooka if (rv)
391 1.12 pooka return rv;
392 1.12 pooka
393 1.21 pooka vp->v_size = vp->v_writesize = va->va_size;
394 1.21 pooka vp->v_type = va->va_type;
395 1.1 pooka
396 1.21 pooka if (vpops == rump_specop_p) {
397 1.21 pooka spec_node_init(vp, va->va_rdev);
398 1.14 pooka }
399 1.19 pooka vp->v_data = rn;
400 1.14 pooka
401 1.14 pooka vn_lock(vp, LK_RETRY | LK_EXCLUSIVE);
402 1.21 pooka rn->rn_vp = vp;
403 1.6 pooka *vpp = vp;
404 1.6 pooka
405 1.6 pooka return 0;
406 1.1 pooka }
407 1.1 pooka
408 1.1 pooka /*
409 1.14 pooka * Simple lookup for faking lookup of device entry for rump file systems
410 1.14 pooka * and for locating/creating directories. Yes, this will panic if you
411 1.14 pooka * call it with the wrong arguments.
412 1.21 pooka *
413 1.21 pooka * uhm, this is twisted. C F C C, hope of C C F C looming
414 1.1 pooka */
415 1.1 pooka static int
416 1.1 pooka rump_vop_lookup(void *v)
417 1.1 pooka {
418 1.1 pooka struct vop_lookup_args /* {
419 1.1 pooka struct vnode *a_dvp;
420 1.1 pooka struct vnode **a_vpp;
421 1.1 pooka struct componentname *a_cnp;
422 1.1 pooka }; */ *ap = v;
423 1.1 pooka struct componentname *cnp = ap->a_cnp;
424 1.14 pooka struct vnode *dvp = ap->a_dvp;
425 1.14 pooka struct vnode **vpp = ap->a_vpp;
426 1.14 pooka struct vnode *vp;
427 1.21 pooka struct rumpfs_node *rnd = dvp->v_data, *rn;
428 1.21 pooka struct rumpfs_dent *rd = NULL;
429 1.21 pooka int rv;
430 1.1 pooka
431 1.1 pooka /* we handle only some "non-special" cases */
432 1.20 pooka if (!(((cnp->cn_flags & ISLASTCN) == 0)
433 1.20 pooka || (cnp->cn_nameiop == LOOKUP || cnp->cn_nameiop == CREATE)))
434 1.20 pooka return EOPNOTSUPP;
435 1.20 pooka if (!((cnp->cn_flags & ISDOTDOT) == 0))
436 1.20 pooka return EOPNOTSUPP;
437 1.20 pooka if (!(cnp->cn_namelen != 0 && cnp->cn_pnbuf[0] != '.'))
438 1.20 pooka return EOPNOTSUPP;
439 1.1 pooka
440 1.14 pooka /* check if we are returning a faked block device */
441 1.14 pooka if (dvp == rootvnode && cnp->cn_nameiop == LOOKUP) {
442 1.21 pooka mutex_enter(&etfs_lock);
443 1.21 pooka if (etfs_find(cnp->cn_pnbuf, &rn)) {
444 1.21 pooka mutex_exit(&etfs_lock);
445 1.14 pooka cnp->cn_consume = strlen(cnp->cn_nameptr
446 1.14 pooka + cnp->cn_namelen);
447 1.14 pooka cnp->cn_flags &= ~REQUIREDIR;
448 1.21 pooka goto getvnode;
449 1.14 pooka }
450 1.21 pooka mutex_exit(&etfs_lock);
451 1.14 pooka }
452 1.14 pooka
453 1.21 pooka if (!rd) {
454 1.21 pooka LIST_FOREACH(rd, &rnd->rn_dir, rd_entries) {
455 1.21 pooka if (strncmp(rd->rd_name, cnp->cn_nameptr,
456 1.21 pooka cnp->cn_namelen) == 0)
457 1.21 pooka break;
458 1.21 pooka }
459 1.14 pooka }
460 1.14 pooka
461 1.14 pooka if (!rd && ((cnp->cn_flags & ISLASTCN) == 0||cnp->cn_nameiop != CREATE))
462 1.14 pooka return ENOENT;
463 1.14 pooka
464 1.14 pooka if (!rd && (cnp->cn_flags & ISLASTCN) && cnp->cn_nameiop == CREATE) {
465 1.14 pooka cnp->cn_flags |= SAVENAME;
466 1.14 pooka return EJUSTRETURN;
467 1.7 pooka }
468 1.21 pooka rn = rd->rd_node;
469 1.21 pooka rd = NULL;
470 1.1 pooka
471 1.21 pooka getvnode:
472 1.21 pooka KASSERT(rn);
473 1.14 pooka mutex_enter(&reclock);
474 1.21 pooka if ((vp = rn->rn_vp)) {
475 1.14 pooka mutex_enter(&vp->v_interlock);
476 1.14 pooka mutex_exit(&reclock);
477 1.14 pooka if (vget(vp, LK_EXCLUSIVE | LK_INTERLOCK))
478 1.21 pooka goto getvnode;
479 1.14 pooka *vpp = vp;
480 1.14 pooka } else {
481 1.30 pooka rv = makevnode(dvp->v_mount, rn, vpp);
482 1.21 pooka rn->rn_vp = *vpp;
483 1.21 pooka mutex_exit(&reclock);
484 1.14 pooka if (rv)
485 1.14 pooka return rv;
486 1.14 pooka }
487 1.1 pooka
488 1.1 pooka return 0;
489 1.1 pooka }
490 1.1 pooka
491 1.9 pooka static int
492 1.9 pooka rump_vop_getattr(void *v)
493 1.9 pooka {
494 1.9 pooka struct vop_getattr_args /* {
495 1.9 pooka struct vnode *a_vp;
496 1.9 pooka struct vattr *a_vap;
497 1.9 pooka kauth_cred_t a_cred;
498 1.9 pooka } */ *ap = v;
499 1.14 pooka struct rumpfs_node *rn = ap->a_vp->v_data;
500 1.9 pooka
501 1.14 pooka memcpy(ap->a_vap, &rn->rn_va, sizeof(struct vattr));
502 1.9 pooka return 0;
503 1.9 pooka }
504 1.9 pooka
505 1.9 pooka static int
506 1.14 pooka rump_vop_mkdir(void *v)
507 1.14 pooka {
508 1.14 pooka struct vop_mkdir_args /* {
509 1.14 pooka struct vnode *a_dvp;
510 1.14 pooka struct vnode **a_vpp;
511 1.14 pooka struct componentname *a_cnp;
512 1.14 pooka struct vattr *a_vap;
513 1.14 pooka }; */ *ap = v;
514 1.14 pooka struct vnode *dvp = ap->a_dvp;
515 1.14 pooka struct vnode **vpp = ap->a_vpp;
516 1.14 pooka struct componentname *cnp = ap->a_cnp;
517 1.21 pooka struct rumpfs_node *rnd = dvp->v_data, *rn;
518 1.14 pooka struct rumpfs_dent *rdent;
519 1.14 pooka int rv = 0;
520 1.14 pooka
521 1.27 pooka rn = makeprivate(VDIR, NODEV, DEV_BSIZE);
522 1.21 pooka mutex_enter(&reclock);
523 1.30 pooka rv = makevnode(dvp->v_mount, rn, vpp);
524 1.21 pooka mutex_exit(&reclock);
525 1.21 pooka if (rv)
526 1.14 pooka goto out;
527 1.14 pooka
528 1.14 pooka rdent = kmem_alloc(sizeof(*rdent), KM_SLEEP);
529 1.14 pooka rdent->rd_name = kmem_alloc(cnp->cn_namelen+1, KM_SLEEP);
530 1.14 pooka rdent->rd_node = (*vpp)->v_data;
531 1.14 pooka strlcpy(rdent->rd_name, cnp->cn_nameptr, cnp->cn_namelen+1);
532 1.14 pooka
533 1.14 pooka LIST_INSERT_HEAD(&rnd->rn_dir, rdent, rd_entries);
534 1.14 pooka
535 1.14 pooka out:
536 1.14 pooka vput(dvp);
537 1.14 pooka return rv;
538 1.14 pooka }
539 1.14 pooka
540 1.14 pooka static int
541 1.19 pooka rump_vop_mknod(void *v)
542 1.19 pooka {
543 1.19 pooka struct vop_mknod_args /* {
544 1.19 pooka struct vnode *a_dvp;
545 1.19 pooka struct vnode **a_vpp;
546 1.19 pooka struct componentname *a_cnp;
547 1.19 pooka struct vattr *a_vap;
548 1.19 pooka }; */ *ap = v;
549 1.19 pooka struct vnode *dvp = ap->a_dvp;
550 1.19 pooka struct vnode **vpp = ap->a_vpp;
551 1.19 pooka struct componentname *cnp = ap->a_cnp;
552 1.19 pooka struct vattr *va = ap->a_vap;
553 1.21 pooka struct rumpfs_node *rnd = dvp->v_data, *rn;
554 1.19 pooka struct rumpfs_dent *rdent;
555 1.19 pooka int rv;
556 1.19 pooka
557 1.27 pooka rn = makeprivate(va->va_type, va->va_rdev, DEV_BSIZE);
558 1.21 pooka mutex_enter(&reclock);
559 1.30 pooka rv = makevnode(dvp->v_mount, rn, vpp);
560 1.21 pooka mutex_exit(&reclock);
561 1.21 pooka if (rv)
562 1.19 pooka goto out;
563 1.19 pooka
564 1.19 pooka rdent = kmem_alloc(sizeof(*rdent), KM_SLEEP);
565 1.19 pooka rdent->rd_name = kmem_alloc(cnp->cn_namelen+1, KM_SLEEP);
566 1.19 pooka rdent->rd_node = (*vpp)->v_data;
567 1.19 pooka rdent->rd_node->rn_va.va_rdev = va->va_rdev;
568 1.19 pooka strlcpy(rdent->rd_name, cnp->cn_nameptr, cnp->cn_namelen+1);
569 1.19 pooka
570 1.19 pooka LIST_INSERT_HEAD(&rnd->rn_dir, rdent, rd_entries);
571 1.19 pooka
572 1.19 pooka out:
573 1.19 pooka vput(dvp);
574 1.19 pooka return rv;
575 1.19 pooka }
576 1.19 pooka
577 1.19 pooka static int
578 1.26 pooka rump_vop_create(void *v)
579 1.26 pooka {
580 1.26 pooka struct vop_create_args /* {
581 1.26 pooka struct vnode *a_dvp;
582 1.26 pooka struct vnode **a_vpp;
583 1.26 pooka struct componentname *a_cnp;
584 1.26 pooka struct vattr *a_vap;
585 1.26 pooka }; */ *ap = v;
586 1.26 pooka struct vnode *dvp = ap->a_dvp;
587 1.26 pooka struct vnode **vpp = ap->a_vpp;
588 1.26 pooka struct componentname *cnp = ap->a_cnp;
589 1.26 pooka struct vattr *va = ap->a_vap;
590 1.26 pooka struct rumpfs_node *rnd = dvp->v_data, *rn;
591 1.26 pooka struct rumpfs_dent *rdent;
592 1.26 pooka int rv;
593 1.26 pooka
594 1.26 pooka if (va->va_type != VSOCK) {
595 1.26 pooka rv = EOPNOTSUPP;
596 1.26 pooka goto out;
597 1.26 pooka }
598 1.27 pooka rn = makeprivate(VSOCK, NODEV, DEV_BSIZE);
599 1.26 pooka mutex_enter(&reclock);
600 1.30 pooka rv = makevnode(dvp->v_mount, rn, vpp);
601 1.26 pooka mutex_exit(&reclock);
602 1.26 pooka if (rv)
603 1.26 pooka goto out;
604 1.26 pooka
605 1.26 pooka rdent = kmem_alloc(sizeof(*rdent), KM_SLEEP);
606 1.26 pooka rdent->rd_name = kmem_alloc(cnp->cn_namelen+1, KM_SLEEP);
607 1.26 pooka rdent->rd_node = (*vpp)->v_data;
608 1.26 pooka rdent->rd_node->rn_va.va_rdev = NODEV;
609 1.26 pooka strlcpy(rdent->rd_name, cnp->cn_nameptr, cnp->cn_namelen+1);
610 1.26 pooka
611 1.26 pooka LIST_INSERT_HEAD(&rnd->rn_dir, rdent, rd_entries);
612 1.26 pooka
613 1.26 pooka out:
614 1.26 pooka vput(dvp);
615 1.26 pooka return rv;
616 1.26 pooka }
617 1.26 pooka
618 1.26 pooka static int
619 1.24 pooka rump_vop_open(void *v)
620 1.24 pooka {
621 1.24 pooka struct vop_open_args /* {
622 1.24 pooka struct vnode *a_vp;
623 1.24 pooka int a_mode;
624 1.24 pooka kauth_cred_t a_cred;
625 1.24 pooka } */ *ap = v;
626 1.24 pooka struct vnode *vp = ap->a_vp;
627 1.24 pooka struct rumpfs_node *rn = vp->v_data;
628 1.24 pooka int mode = ap->a_mode;
629 1.24 pooka int error = EINVAL;
630 1.24 pooka
631 1.24 pooka if (vp->v_type != VREG)
632 1.24 pooka return 0;
633 1.24 pooka
634 1.24 pooka if (mode & FREAD) {
635 1.24 pooka if (rn->rn_readfd != -1)
636 1.24 pooka return 0;
637 1.24 pooka rn->rn_readfd = rumpuser_open(rn->rn_hostpath,
638 1.24 pooka O_RDONLY, &error);
639 1.24 pooka } else if (mode & FWRITE) {
640 1.24 pooka if (rn->rn_writefd != -1)
641 1.24 pooka return 0;
642 1.24 pooka rn->rn_writefd = rumpuser_open(rn->rn_hostpath,
643 1.24 pooka O_WRONLY, &error);
644 1.24 pooka }
645 1.24 pooka
646 1.24 pooka return error;
647 1.24 pooka }
648 1.24 pooka
649 1.24 pooka static int
650 1.24 pooka rump_vop_read(void *v)
651 1.24 pooka {
652 1.24 pooka struct vop_read_args /* {
653 1.24 pooka struct vnode *a_vp;
654 1.24 pooka struct uio *a_uio;
655 1.24 pooka int ioflags a_ioflag;
656 1.24 pooka kauth_cred_t a_cred;
657 1.24 pooka }; */ *ap = v;
658 1.24 pooka struct vnode *vp = ap->a_vp;
659 1.24 pooka struct rumpfs_node *rn = vp->v_data;
660 1.24 pooka struct uio *uio = ap->a_uio;
661 1.24 pooka uint8_t *buf;
662 1.24 pooka size_t bufsize;
663 1.24 pooka int error = 0;
664 1.24 pooka
665 1.24 pooka bufsize = uio->uio_resid;
666 1.24 pooka buf = kmem_alloc(bufsize, KM_SLEEP);
667 1.27 pooka if (rumpuser_pread(rn->rn_readfd, buf, bufsize,
668 1.27 pooka uio->uio_offset + rn->rn_offset, &error) == -1)
669 1.24 pooka goto out;
670 1.24 pooka error = uiomove(buf, bufsize, uio);
671 1.24 pooka
672 1.24 pooka out:
673 1.24 pooka kmem_free(buf, bufsize);
674 1.24 pooka return error;
675 1.24 pooka }
676 1.24 pooka
677 1.24 pooka static int
678 1.24 pooka rump_vop_write(void *v)
679 1.24 pooka {
680 1.24 pooka struct vop_read_args /* {
681 1.24 pooka struct vnode *a_vp;
682 1.24 pooka struct uio *a_uio;
683 1.24 pooka int ioflags a_ioflag;
684 1.24 pooka kauth_cred_t a_cred;
685 1.24 pooka }; */ *ap = v;
686 1.24 pooka struct vnode *vp = ap->a_vp;
687 1.24 pooka struct rumpfs_node *rn = vp->v_data;
688 1.24 pooka struct uio *uio = ap->a_uio;
689 1.24 pooka uint8_t *buf;
690 1.24 pooka size_t bufsize;
691 1.24 pooka int error = 0;
692 1.24 pooka
693 1.24 pooka bufsize = uio->uio_resid;
694 1.24 pooka buf = kmem_alloc(bufsize, KM_SLEEP);
695 1.24 pooka error = uiomove(buf, bufsize, uio);
696 1.24 pooka if (error)
697 1.24 pooka goto out;
698 1.24 pooka KASSERT(uio->uio_resid == 0);
699 1.27 pooka rumpuser_pwrite(rn->rn_writefd, buf, bufsize,
700 1.27 pooka uio->uio_offset + rn->rn_offset, &error);
701 1.24 pooka
702 1.24 pooka out:
703 1.24 pooka kmem_free(buf, bufsize);
704 1.24 pooka return error;
705 1.24 pooka }
706 1.24 pooka
/*
 * Vnode operation that does nothing and reports success; the argument
 * structure is not looked at.
 */
static int
rump_vop_success(void *v)
{
	const int ok = 0;

	(void)v;
	return ok;
}
713 1.9 pooka
714 1.12 pooka static int
715 1.14 pooka rump_vop_inactive(void *v)
716 1.14 pooka {
717 1.14 pooka struct vop_inactive_args *ap = v;
718 1.24 pooka struct vnode *vp = ap->a_vp;
719 1.24 pooka struct rumpfs_node *rn = vp->v_data;
720 1.24 pooka int error;
721 1.14 pooka
722 1.24 pooka if (vp->v_type == VREG) {
723 1.24 pooka if (rn->rn_readfd != -1) {
724 1.24 pooka rumpuser_close(rn->rn_readfd, &error);
725 1.24 pooka rn->rn_readfd = -1;
726 1.24 pooka }
727 1.24 pooka if (rn->rn_writefd != -1) {
728 1.24 pooka rumpuser_close(rn->rn_writefd, &error);
729 1.24 pooka rn->rn_writefd = -1;
730 1.24 pooka }
731 1.24 pooka }
732 1.24 pooka
733 1.24 pooka VOP_UNLOCK(vp, 0);
734 1.14 pooka return 0;
735 1.14 pooka }
736 1.14 pooka
737 1.14 pooka static int
738 1.12 pooka rump_vop_reclaim(void *v)
739 1.12 pooka {
740 1.12 pooka struct vop_reclaim_args /* {
741 1.12 pooka struct vnode *a_vp;
742 1.12 pooka } */ *ap = v;
743 1.12 pooka struct vnode *vp = ap->a_vp;
744 1.14 pooka struct rumpfs_node *rn = vp->v_data;
745 1.12 pooka
746 1.14 pooka mutex_enter(&reclock);
747 1.14 pooka rn->rn_vp = NULL;
748 1.14 pooka mutex_exit(&reclock);
749 1.12 pooka vp->v_data = NULL;
750 1.12 pooka
751 1.12 pooka return 0;
752 1.12 pooka }
753 1.12 pooka
754 1.19 pooka static int
755 1.19 pooka rump_vop_spec(void *v)
756 1.19 pooka {
757 1.19 pooka struct vop_generic_args *ap = v;
758 1.19 pooka int (**opvec)(void *);
759 1.19 pooka
760 1.19 pooka switch (ap->a_desc->vdesc_offset) {
761 1.19 pooka case VOP_ACCESS_DESCOFFSET:
762 1.19 pooka case VOP_GETATTR_DESCOFFSET:
763 1.22 pooka case VOP_LOCK_DESCOFFSET:
764 1.22 pooka case VOP_UNLOCK_DESCOFFSET:
765 1.19 pooka opvec = rump_vnodeop_p;
766 1.19 pooka break;
767 1.19 pooka default:
768 1.19 pooka opvec = spec_vnodeop_p;
769 1.19 pooka break;
770 1.19 pooka }
771 1.19 pooka
772 1.19 pooka return VOCALL(opvec, ap->a_desc->vdesc_offset, v);
773 1.19 pooka }
774 1.19 pooka
775 1.30 pooka /*
776 1.30 pooka * Begin vfs-level stuff
777 1.30 pooka */
778 1.30 pooka
779 1.30 pooka VFS_PROTOS(rumpfs);
780 1.30 pooka struct vfsops rumpfs_vfsops = {
781 1.30 pooka .vfs_name = MOUNT_RUMPFS,
782 1.30 pooka .vfs_min_mount_data = 0,
783 1.30 pooka .vfs_mount = rumpfs_mount,
784 1.30 pooka .vfs_start = (void *)nullop,
785 1.30 pooka .vfs_unmount = rumpfs_unmount,
786 1.30 pooka .vfs_root = rumpfs_root,
787 1.30 pooka .vfs_quotactl = (void *)eopnotsupp,
788 1.30 pooka .vfs_sync = (void *)nullop,
789 1.30 pooka .vfs_vget = rumpfs_vget,
790 1.30 pooka .vfs_fhtovp = (void *)eopnotsupp,
791 1.30 pooka .vfs_vptofh = (void *)eopnotsupp,
792 1.30 pooka .vfs_init = rumpfs_init,
793 1.30 pooka .vfs_reinit = NULL,
794 1.30 pooka .vfs_done = rumpfs_done,
795 1.30 pooka .vfs_mountroot = rumpfs_mountroot,
796 1.30 pooka .vfs_snapshot = (void *)eopnotsupp,
797 1.30 pooka .vfs_extattrctl = (void *)eopnotsupp,
798 1.30 pooka .vfs_suspendctl = (void *)eopnotsupp,
799 1.30 pooka .vfs_opv_descs = rump_opv_descs,
800 1.30 pooka /* vfs_refcount */
801 1.30 pooka /* vfs_list */
802 1.30 pooka };
803 1.30 pooka
/*
 * Mount hook.  No argument is examined; the call always fails with
 * EOPNOTSUPP.
 */
int
rumpfs_mount(struct mount *mp, const char *mntpath, void *arg, size_t *alen)
{
	const int unsupported = EOPNOTSUPP;

	return unsupported;
}
810 1.30 pooka
/*
 * Unmount hook.  No argument is examined; the call always fails with
 * EOPNOTSUPP.
 */
int
rumpfs_unmount(struct mount *mp, int flags)
{
	const int unsupported = EOPNOTSUPP;	/* ;) */

	return unsupported;
}
817 1.30 pooka
818 1.30 pooka int
819 1.30 pooka rumpfs_root(struct mount *mp, struct vnode **vpp)
820 1.30 pooka {
821 1.30 pooka struct rumpfs_mount *rfsmp = mp->mnt_data;
822 1.30 pooka
823 1.30 pooka vget(rfsmp->rfsmp_rvp, LK_EXCLUSIVE | LK_RETRY);
824 1.30 pooka *vpp = rfsmp->rfsmp_rvp;
825 1.30 pooka return 0;
826 1.30 pooka }
827 1.30 pooka
/*
 * Vget hook (lookup by inode number).  No argument is examined; the
 * call always fails with EOPNOTSUPP.
 */
int
rumpfs_vget(struct mount *mp, ino_t ino, struct vnode **vpp)
{
	const int unsupported = EOPNOTSUPP;

	return unsupported;
}
834 1.30 pooka
835 1.1 pooka void
836 1.30 pooka rumpfs_init()
837 1.1 pooka {
838 1.1 pooka
839 1.25 pooka CTASSERT(RUMP_ETFS_SIZE_ENDOFF == RUMPBLK_SIZENOTSET);
840 1.25 pooka
841 1.14 pooka mutex_init(&reclock, MUTEX_DEFAULT, IPL_NONE);
842 1.21 pooka mutex_init(&etfs_lock, MUTEX_DEFAULT, IPL_NONE);
843 1.30 pooka }
844 1.30 pooka
845 1.30 pooka void
846 1.30 pooka rumpfs_done()
847 1.30 pooka {
848 1.30 pooka
849 1.30 pooka mutex_destroy(&reclock);
850 1.30 pooka mutex_destroy(&etfs_lock);
851 1.30 pooka }
852 1.14 pooka
853 1.30 pooka int
854 1.30 pooka rumpfs_mountroot()
855 1.30 pooka {
856 1.30 pooka struct mount *mp;
857 1.30 pooka struct rumpfs_mount *rfsmp;
858 1.30 pooka struct rumpfs_node *rn;
859 1.30 pooka int error;
860 1.30 pooka
861 1.30 pooka if ((error = vfs_rootmountalloc(MOUNT_RUMPFS, "rootdev", &mp)) != 0) {
862 1.30 pooka vrele(rootvp);
863 1.30 pooka return error;
864 1.30 pooka }
865 1.30 pooka
866 1.30 pooka rfsmp = kmem_alloc(sizeof(*rfsmp), KM_SLEEP);
867 1.12 pooka
868 1.27 pooka rn = makeprivate(VDIR, NODEV, DEV_BSIZE);
869 1.21 pooka mutex_enter(&reclock);
870 1.30 pooka error = makevnode(mp, rn, &rfsmp->rfsmp_rvp);
871 1.21 pooka mutex_exit(&reclock);
872 1.30 pooka rfsmp->rfsmp_rvp->v_vflag |= VV_ROOT;
873 1.30 pooka if (error)
874 1.30 pooka panic("could not create root vnode: %d", error);
875 1.30 pooka mp->mnt_data = rfsmp;
876 1.30 pooka VOP_UNLOCK(rfsmp->rfsmp_rvp, 0);
877 1.30 pooka
878 1.30 pooka mp->mnt_flag |= MNT_ROOTFS;
879 1.30 pooka rumpfs_vfsops.vfs_refcount++;
880 1.30 pooka
881 1.30 pooka mutex_enter(&mountlist_lock);
882 1.30 pooka CIRCLEQ_INSERT_TAIL(&mountlist, mp, mnt_list);
883 1.30 pooka mutex_exit(&mountlist_lock);
884 1.30 pooka
885 1.30 pooka vfs_unbusy(mp, false, NULL);
886 1.30 pooka
887 1.30 pooka return 0;
888 1.30 pooka }
889 1.30 pooka
890 1.30 pooka MODULE(MODULE_CLASS_VFS, rumpfs, NULL);
891 1.30 pooka
892 1.30 pooka static int
893 1.30 pooka rumpfs_modcmd(modcmd_t cmd, void *arg)
894 1.30 pooka {
895 1.30 pooka
896 1.30 pooka switch (cmd) {
897 1.30 pooka case MODULE_CMD_INIT:
898 1.30 pooka return vfs_attach(&rumpfs_vfsops);
899 1.30 pooka case MODULE_CMD_FINI:
900 1.30 pooka return vfs_detach(&rumpfs_vfsops);
901 1.30 pooka default:
902 1.30 pooka return ENOTTY;
903 1.30 pooka }
904 1.1 pooka }
905