puffs_vnops.c revision 1.82 1 /* $NetBSD: puffs_vnops.c,v 1.82 2007/07/01 17:22:18 pooka Exp $ */
2
3 /*
4 * Copyright (c) 2005, 2006, 2007 Antti Kantee. All Rights Reserved.
5 *
6 * Development of this software was supported by the
7 * Google Summer of Code program and the Ulla Tuominen Foundation.
8 * The Google SoC project was mentored by Bill Studenmund.
9 *
10 * Redistribution and use in source and binary forms, with or without
11 * modification, are permitted provided that the following conditions
12 * are met:
13 * 1. Redistributions of source code must retain the above copyright
14 * notice, this list of conditions and the following disclaimer.
15 * 2. Redistributions in binary form must reproduce the above copyright
16 * notice, this list of conditions and the following disclaimer in the
17 * documentation and/or other materials provided with the distribution.
18 *
19 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS
20 * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
21 * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
22 * DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
23 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
24 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
25 * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
26 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
27 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
28 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29 * SUCH DAMAGE.
30 */
31
32 #include <sys/cdefs.h>
33 __KERNEL_RCSID(0, "$NetBSD: puffs_vnops.c,v 1.82 2007/07/01 17:22:18 pooka Exp $");
34
35 #include <sys/param.h>
36 #include <sys/fstrans.h>
37 #include <sys/malloc.h>
38 #include <sys/mount.h>
39 #include <sys/namei.h>
40 #include <sys/vnode.h>
41 #include <uvm/uvm.h>
42
43 #include <fs/puffs/puffs_msgif.h>
44 #include <fs/puffs/puffs_sys.h>
45
46 #include <miscfs/fifofs/fifo.h>
47 #include <miscfs/genfs/genfs.h>
48 #include <miscfs/specfs/specdev.h>
49
/*
 * Forward declarations for the puffs vnode operation handlers.  Every
 * handler receives its argument block as a void pointer and casts it to
 * the matching vop_*_args structure itself.
 */
int puffs_lookup(void *);
int puffs_create(void *);
int puffs_access(void *);
int puffs_mknod(void *);
int puffs_open(void *);
int puffs_close(void *);
int puffs_getattr(void *);
int puffs_setattr(void *);
int puffs_reclaim(void *);
int puffs_readdir(void *);
int puffs_poll(void *);
int puffs_fsync(void *);
int puffs_seek(void *);
int puffs_remove(void *);
int puffs_mkdir(void *);
int puffs_rmdir(void *);
int puffs_link(void *);
int puffs_readlink(void *);
int puffs_symlink(void *);
int puffs_rename(void *);
int puffs_read(void *);
int puffs_write(void *);
int puffs_fcntl(void *);
int puffs_ioctl(void *);
int puffs_inactive(void *);
int puffs_print(void *);
int puffs_pathconf(void *);
int puffs_advlock(void *);
int puffs_strategy(void *);
int puffs_bmap(void *);
int puffs_mmap(void *);
int puffs_getpages(void *);

/* read/write wrappers installed in the special-device and fifo vectors */
int puffs_spec_read(void *);
int puffs_spec_write(void *);
int puffs_fifo_read(void *);
int puffs_fifo_write(void *);

/* gatekeeper placed in front of the optional operations, see below */
int puffs_checkop(void *);


/* VOP_LEASE() not included */

int puffs_generic(void *);

/*
 * Locking entry points: the genfs aliases are compiled out, the
 * puffs-specific implementations declared in the #else branch are used.
 */
#if 0
#define puffs_lock genfs_lock
#define puffs_unlock genfs_unlock
#define puffs_islocked genfs_islocked
#else
int puffs_lock(void *);
int puffs_unlock(void *);
int puffs_islocked(void *);
#endif
104
/*
 * Primary vnode operations vector.  Entries tagged "REAL" go straight to
 * their handler.  All other operations are routed through puffs_checkop(),
 * which looks at the mount's operation mask and then either answers on
 * its own or forwards the call to the handler in puffs_msgop_p.
 */
int (**puffs_vnodeop_p)(void *);
const struct vnodeopv_entry_desc puffs_vnodeop_entries[] = {
	{ &vop_default_desc, vn_default_error },
	{ &vop_lookup_desc, puffs_lookup },		/* REAL lookup */
	{ &vop_create_desc, puffs_checkop },		/* create */
	{ &vop_mknod_desc, puffs_checkop },		/* mknod */
	{ &vop_open_desc, puffs_open },			/* REAL open */
	{ &vop_close_desc, puffs_checkop },		/* close */
	{ &vop_access_desc, puffs_access },		/* REAL access */
	{ &vop_getattr_desc, puffs_checkop },		/* getattr */
	{ &vop_setattr_desc, puffs_checkop },		/* setattr */
	{ &vop_read_desc, puffs_checkop },		/* read */
	{ &vop_write_desc, puffs_checkop },		/* write */
	{ &vop_fcntl_desc, puffs_checkop },		/* fcntl */
	{ &vop_ioctl_desc, puffs_checkop },		/* ioctl */
	{ &vop_fsync_desc, puffs_fsync },		/* REAL fsync */
	{ &vop_seek_desc, puffs_checkop },		/* seek */
	{ &vop_remove_desc, puffs_checkop },		/* remove */
	{ &vop_link_desc, puffs_checkop },		/* link */
	{ &vop_rename_desc, puffs_checkop },		/* rename */
	{ &vop_mkdir_desc, puffs_checkop },		/* mkdir */
	{ &vop_rmdir_desc, puffs_checkop },		/* rmdir */
	{ &vop_symlink_desc, puffs_checkop },		/* symlink */
	{ &vop_readdir_desc, puffs_checkop },		/* readdir */
	{ &vop_readlink_desc, puffs_checkop },		/* readlink */
	{ &vop_getpages_desc, puffs_checkop },		/* getpages */
	{ &vop_putpages_desc, genfs_putpages },		/* REAL putpages */
	{ &vop_pathconf_desc, puffs_checkop },		/* pathconf */
	{ &vop_advlock_desc, puffs_checkop },		/* advlock */
	{ &vop_strategy_desc, puffs_strategy },		/* REAL strategy */
	{ &vop_revoke_desc, genfs_revoke },		/* REAL revoke */
	{ &vop_abortop_desc, genfs_abortop },		/* REAL abortop */
	{ &vop_inactive_desc, puffs_inactive },		/* REAL inactive */
	{ &vop_reclaim_desc, puffs_reclaim },		/* REAL reclaim */
	{ &vop_lock_desc, puffs_lock },			/* REAL lock */
	{ &vop_unlock_desc, puffs_unlock },		/* REAL unlock */
	{ &vop_bmap_desc, puffs_bmap },			/* REAL bmap */
	{ &vop_print_desc, puffs_print },		/* REAL print */
	{ &vop_islocked_desc, puffs_islocked },		/* REAL islocked */
	{ &vop_bwrite_desc, genfs_nullop },		/* REAL bwrite */
	{ &vop_mmap_desc, puffs_mmap },			/* REAL mmap */
	{ &vop_poll_desc, puffs_poll },			/* REAL poll */

	{ &vop_kqfilter_desc, genfs_eopnotsupp },	/* kqfilter XXX */
	{ NULL, NULL }					/* end of table */
};
/* ties the dispatch pointer to the entry list above */
const struct vnodeopv_desc puffs_vnodeop_opv_desc =
	{ &puffs_vnodeop_p, puffs_vnodeop_entries };
153
154
/*
 * Operations vector built around the spec_* handlers (presumably used for
 * device special vnodes -- confirm against the vnode creation code).
 * Attribute operations go through puffs_checkop(), read and write use the
 * puffs_spec_* wrappers, and inactive/reclaim/locking/print stay with the
 * puffs implementations.  The trailing comments on spec_* entries are the
 * original author's notes on what each spec_* name resolves to.
 */
int (**puffs_specop_p)(void *);
const struct vnodeopv_entry_desc puffs_specop_entries[] = {
	{ &vop_default_desc, vn_default_error },
	{ &vop_lookup_desc, spec_lookup },		/* lookup, ENOTDIR */
	{ &vop_create_desc, spec_create },		/* genfs_badop */
	{ &vop_mknod_desc, spec_mknod },		/* genfs_badop */
	{ &vop_open_desc, spec_open },			/* spec_open */
	{ &vop_close_desc, spec_close },		/* spec_close */
	{ &vop_access_desc, puffs_checkop },		/* access */
	{ &vop_getattr_desc, puffs_checkop },		/* getattr */
	{ &vop_setattr_desc, puffs_checkop },		/* setattr */
	{ &vop_read_desc, puffs_spec_read },		/* update, read */
	{ &vop_write_desc, puffs_spec_write },		/* update, write */
	{ &vop_lease_desc, spec_lease_check },		/* genfs_nullop */
	{ &vop_ioctl_desc, spec_ioctl },		/* spec_ioctl */
	{ &vop_fcntl_desc, genfs_fcntl },		/* dummy */
	{ &vop_poll_desc, spec_poll },			/* spec_poll */
	{ &vop_kqfilter_desc, spec_kqfilter },		/* spec_kqfilter */
	{ &vop_revoke_desc, spec_revoke },		/* genfs_revoke */
	{ &vop_mmap_desc, spec_mmap },			/* spec_mmap */
	{ &vop_fsync_desc, spec_fsync },		/* vflushbuf */
	{ &vop_seek_desc, spec_seek },			/* genfs_nullop */
	{ &vop_remove_desc, spec_remove },		/* genfs_badop */
	{ &vop_link_desc, spec_link },			/* genfs_badop */
	{ &vop_rename_desc, spec_rename },		/* genfs_badop */
	{ &vop_mkdir_desc, spec_mkdir },		/* genfs_badop */
	{ &vop_rmdir_desc, spec_rmdir },		/* genfs_badop */
	{ &vop_symlink_desc, spec_symlink },		/* genfs_badop */
	{ &vop_readdir_desc, spec_readdir },		/* genfs_badop */
	{ &vop_readlink_desc, spec_readlink },		/* genfs_badop */
	{ &vop_abortop_desc, spec_abortop },		/* genfs_badop */
	{ &vop_inactive_desc, puffs_inactive },		/* REAL inactive */
	{ &vop_reclaim_desc, puffs_reclaim },		/* REAL reclaim */
	{ &vop_lock_desc, puffs_lock },			/* REAL lock */
	{ &vop_unlock_desc, puffs_unlock },		/* REAL unlock */
	{ &vop_bmap_desc, spec_bmap },			/* dummy */
	{ &vop_strategy_desc, spec_strategy },		/* dev strategy */
	{ &vop_print_desc, puffs_print },		/* REAL print */
	{ &vop_islocked_desc, puffs_islocked },		/* REAL islocked */
	{ &vop_pathconf_desc, spec_pathconf },		/* pathconf */
	{ &vop_advlock_desc, spec_advlock },		/* lf_advlock */
	{ &vop_bwrite_desc, vn_bwrite },		/* bwrite */
	{ &vop_getpages_desc, spec_getpages },		/* genfs_getpages */
	{ &vop_putpages_desc, spec_putpages },		/* genfs_putpages */
/* extended attribute operations are compiled out */
#if 0
	{ &vop_openextattr_desc, _openextattr },	/* openextattr */
	{ &vop_closeextattr_desc, _closeextattr },	/* closeextattr */
	{ &vop_getextattr_desc, _getextattr },		/* getextattr */
	{ &vop_setextattr_desc, _setextattr },		/* setextattr */
	{ &vop_listextattr_desc, _listextattr },	/* listextattr */
	{ &vop_deleteextattr_desc, _deleteextattr },	/* deleteextattr */
#endif
	{ NULL, NULL }					/* end of table */
};
/* ties the dispatch pointer to the entry list above */
const struct vnodeopv_desc puffs_specop_opv_desc =
	{ &puffs_specop_p, puffs_specop_entries };
211
212
/*
 * Operations vector built around the fifo_* handlers (presumably used for
 * fifo vnodes -- confirm against the vnode creation code).  It mirrors
 * the special-device vector: attribute operations go through
 * puffs_checkop(), read and write use the puffs_fifo_* wrappers, and
 * inactive/reclaim/locking/print stay with the puffs implementations.
 * Note that this table carries no getpages entry.
 */
int (**puffs_fifoop_p)(void *);
const struct vnodeopv_entry_desc puffs_fifoop_entries[] = {
	{ &vop_default_desc, vn_default_error },
	{ &vop_lookup_desc, fifo_lookup },		/* lookup, ENOTDIR */
	{ &vop_create_desc, fifo_create },		/* genfs_badop */
	{ &vop_mknod_desc, fifo_mknod },		/* genfs_badop */
	{ &vop_open_desc, fifo_open },			/* open */
	{ &vop_close_desc, fifo_close },		/* close */
	{ &vop_access_desc, puffs_checkop },		/* access */
	{ &vop_getattr_desc, puffs_checkop },		/* getattr */
	{ &vop_setattr_desc, puffs_checkop },		/* setattr */
	{ &vop_read_desc, puffs_fifo_read },		/* read, update */
	{ &vop_write_desc, puffs_fifo_write },		/* write, update */
	{ &vop_lease_desc, fifo_lease_check },		/* genfs_nullop */
	{ &vop_ioctl_desc, fifo_ioctl },		/* ioctl */
	{ &vop_fcntl_desc, genfs_fcntl },		/* dummy */
	{ &vop_poll_desc, fifo_poll },			/* poll */
	{ &vop_kqfilter_desc, fifo_kqfilter },		/* kqfilter */
	{ &vop_revoke_desc, fifo_revoke },		/* genfs_revoke */
	{ &vop_mmap_desc, fifo_mmap },			/* genfs_badop */
	{ &vop_fsync_desc, fifo_fsync },		/* genfs_nullop*/
	{ &vop_seek_desc, fifo_seek },			/* genfs_badop */
	{ &vop_remove_desc, fifo_remove },		/* genfs_badop */
	{ &vop_link_desc, fifo_link },			/* genfs_badop */
	{ &vop_rename_desc, fifo_rename },		/* genfs_badop */
	{ &vop_mkdir_desc, fifo_mkdir },		/* genfs_badop */
	{ &vop_rmdir_desc, fifo_rmdir },		/* genfs_badop */
	{ &vop_symlink_desc, fifo_symlink },		/* genfs_badop */
	{ &vop_readdir_desc, fifo_readdir },		/* genfs_badop */
	{ &vop_readlink_desc, fifo_readlink },		/* genfs_badop */
	{ &vop_abortop_desc, fifo_abortop },		/* genfs_badop */
	{ &vop_inactive_desc, puffs_inactive },		/* REAL inactive */
	{ &vop_reclaim_desc, puffs_reclaim },		/* REAL reclaim */
	{ &vop_lock_desc, puffs_lock },			/* REAL lock */
	{ &vop_unlock_desc, puffs_unlock },		/* REAL unlock */
	{ &vop_bmap_desc, fifo_bmap },			/* dummy */
	{ &vop_strategy_desc, fifo_strategy },		/* genfs_badop */
	{ &vop_print_desc, puffs_print },		/* REAL print */
	{ &vop_islocked_desc, puffs_islocked },		/* REAL islocked */
	{ &vop_pathconf_desc, fifo_pathconf },		/* pathconf */
	{ &vop_advlock_desc, fifo_advlock },		/* genfs_einval */
	{ &vop_bwrite_desc, vn_bwrite },		/* bwrite */
	{ &vop_putpages_desc, fifo_putpages },		/* genfs_null_putpages*/
/* extended attribute operations are compiled out */
#if 0
	{ &vop_openextattr_desc, _openextattr },	/* openextattr */
	{ &vop_closeextattr_desc, _closeextattr },	/* closeextattr */
	{ &vop_getextattr_desc, _getextattr },		/* getextattr */
	{ &vop_setextattr_desc, _setextattr },		/* setextattr */
	{ &vop_listextattr_desc, _listextattr },	/* listextattr */
	{ &vop_deleteextattr_desc, _deleteextattr },	/* deleteextattr */
#endif
	{ NULL, NULL }					/* end of table */
};
/* ties the dispatch pointer to the entry list above */
const struct vnodeopv_desc puffs_fifoop_opv_desc =
	{ &puffs_fifoop_p, puffs_fifoop_entries };
268
269
/*
 * "real" vnode operations
 *
 * This vector holds the handlers that actually implement each operation.
 * It is the vector puffs_checkop() dispatches into with VOCALL() once it
 * has decided that the call should go ahead.
 */
int (**puffs_msgop_p)(void *);
const struct vnodeopv_entry_desc puffs_msgop_entries[] = {
	{ &vop_default_desc, vn_default_error },
	{ &vop_create_desc, puffs_create },		/* create */
	{ &vop_mknod_desc, puffs_mknod },		/* mknod */
	{ &vop_open_desc, puffs_open },			/* open */
	{ &vop_close_desc, puffs_close },		/* close */
	{ &vop_access_desc, puffs_access },		/* access */
	{ &vop_getattr_desc, puffs_getattr },		/* getattr */
	{ &vop_setattr_desc, puffs_setattr },		/* setattr */
	{ &vop_read_desc, puffs_read },			/* read */
	{ &vop_write_desc, puffs_write },		/* write */
	{ &vop_fcntl_desc, puffs_fcntl },		/* fcntl */
	{ &vop_ioctl_desc, puffs_ioctl },		/* ioctl */
	{ &vop_seek_desc, puffs_seek },			/* seek */
	{ &vop_remove_desc, puffs_remove },		/* remove */
	{ &vop_link_desc, puffs_link },			/* link */
	{ &vop_rename_desc, puffs_rename },		/* rename */
	{ &vop_mkdir_desc, puffs_mkdir },		/* mkdir */
	{ &vop_rmdir_desc, puffs_rmdir },		/* rmdir */
	{ &vop_symlink_desc, puffs_symlink },		/* symlink */
	{ &vop_readdir_desc, puffs_readdir },		/* readdir */
	{ &vop_readlink_desc, puffs_readlink },		/* readlink */
	{ &vop_print_desc, puffs_print },		/* print */
	{ &vop_islocked_desc, puffs_islocked },		/* islocked */
	{ &vop_pathconf_desc, puffs_pathconf },		/* pathconf */
	{ &vop_advlock_desc, puffs_advlock },		/* advlock */
	{ &vop_getpages_desc, puffs_getpages },		/* getpages */
	{ NULL, NULL }					/* end of table */
};
/* ties the dispatch pointer to the entry list above */
const struct vnodeopv_desc puffs_msgop_opv_desc =
	{ &puffs_msgop_p, puffs_msgop_entries };
303
304
/*
 * Store "err" in the enclosing function's local variable "error" and jump
 * to its "out" label.  Both the variable and the label must exist in the
 * function using the macro.
 */
#define ERROUT(err)							\
do {									\
	error = (err);							\
	goto out;							\
} while (/*CONSTCOND*/0)
310
/*
 * This is a generic vnode operation handler.  It checks if the necessary
 * operations for the called vnode operation are implemented by userspace
 * and either returns a dummy return value or proceeds to call the real
 * vnode operation from puffs_msgop_p.
 *
 * XXX: this should be described elsewhere and autogenerated; the complexity
 * of the vnode operations vectors and their interrelationships is also
 * getting a bit out of hand.  Another problem is that we need this same
 * information in the fs server code, so keeping the two in sync manually
 * is not a viable (long term) plan.
 */
323
324 /* not supported, handle locking protocol */
325 #define CHECKOP_NOTSUPP(op) \
326 case VOP_##op##_DESCOFFSET: \
327 if (pmp->pmp_vnopmask[PUFFS_VN_##op] == 0) \
328 return genfs_eopnotsupp(v); \
329 break
330
331 /* always succeed, no locking */
332 #define CHECKOP_SUCCESS(op) \
333 case VOP_##op##_DESCOFFSET: \
334 if (pmp->pmp_vnopmask[PUFFS_VN_##op] == 0) \
335 return 0; \
336 break
337
338 int
339 puffs_checkop(void *v)
340 {
341 struct vop_generic_args /* {
342 struct vnodeop_desc *a_desc;
343 spooky mystery contents;
344 } */ *ap = v;
345 struct vnodeop_desc *desc = ap->a_desc;
346 struct puffs_mount *pmp;
347 struct vnode *vp;
348 int offset, rv;
349
350 offset = ap->a_desc->vdesc_vp_offsets[0];
351 #ifdef DIAGNOSTIC
352 if (offset == VDESC_NO_OFFSET)
353 panic("puffs_checkop: no vnode, why did you call me?");
354 #endif
355 vp = *VOPARG_OFFSETTO(struct vnode **, offset, ap);
356 pmp = MPTOPUFFSMP(vp->v_mount);
357
358 DPRINTF_VERBOSE(("checkop call %s (%d), vp %p\n",
359 ap->a_desc->vdesc_name, ap->a_desc->vdesc_offset, vp));
360
361 if (!ALLOPS(pmp)) {
362 switch (desc->vdesc_offset) {
363 CHECKOP_NOTSUPP(CREATE);
364 CHECKOP_NOTSUPP(MKNOD);
365 CHECKOP_NOTSUPP(GETATTR);
366 CHECKOP_NOTSUPP(SETATTR);
367 CHECKOP_NOTSUPP(READ);
368 CHECKOP_NOTSUPP(WRITE);
369 CHECKOP_NOTSUPP(FCNTL);
370 CHECKOP_NOTSUPP(IOCTL);
371 CHECKOP_NOTSUPP(REMOVE);
372 CHECKOP_NOTSUPP(LINK);
373 CHECKOP_NOTSUPP(RENAME);
374 CHECKOP_NOTSUPP(MKDIR);
375 CHECKOP_NOTSUPP(RMDIR);
376 CHECKOP_NOTSUPP(SYMLINK);
377 CHECKOP_NOTSUPP(READDIR);
378 CHECKOP_NOTSUPP(READLINK);
379 CHECKOP_NOTSUPP(PRINT);
380 CHECKOP_NOTSUPP(PATHCONF);
381 CHECKOP_NOTSUPP(ADVLOCK);
382
383 CHECKOP_SUCCESS(ACCESS);
384 CHECKOP_SUCCESS(CLOSE);
385 CHECKOP_SUCCESS(SEEK);
386
387 case VOP_GETPAGES_DESCOFFSET:
388 if (!EXISTSOP(pmp, READ))
389 return genfs_eopnotsupp(v);
390 break;
391
392 default:
393 panic("puffs_checkop: unhandled vnop %d",
394 desc->vdesc_offset);
395 }
396 }
397
398 rv = VOCALL(puffs_msgop_p, ap->a_desc->vdesc_offset, v);
399
400 DPRINTF_VERBOSE(("checkop return %s (%d), vp %p: %d\n",
401 ap->a_desc->vdesc_name, ap->a_desc->vdesc_offset, vp, rv));
402
403 return rv;
404 }
405
406
407 int
408 puffs_lookup(void *v)
409 {
410 struct vop_lookup_args /* {
411 const struct vnodeop_desc *a_desc;
412 struct vnode *a_dvp;
413 struct vnode **a_vpp;
414 struct componentname *a_cnp;
415 } */ *ap = v;
416 struct puffs_mount *pmp;
417 struct componentname *cnp;
418 struct vnode *vp, *dvp;
419 struct puffs_node *dpn;
420 int isdot;
421 int error;
422
423 PUFFS_VNREQ(lookup);
424
425 pmp = MPTOPUFFSMP(ap->a_dvp->v_mount);
426 cnp = ap->a_cnp;
427 dvp = ap->a_dvp;
428 *ap->a_vpp = NULL;
429
430 /* first things first: check access */
431 error = VOP_ACCESS(dvp, VEXEC, cnp->cn_cred, cnp->cn_lwp);
432 if (error)
433 return error;
434
435 isdot = cnp->cn_namelen == 1 && *cnp->cn_nameptr == '.';
436
437 DPRINTF(("puffs_lookup: \"%s\", parent vnode %p, op: %lx\n",
438 cnp->cn_nameptr, dvp, cnp->cn_nameiop));
439
440 /*
441 * Check if someone fed it into the cache
442 */
443 if (PUFFS_USE_NAMECACHE(pmp)) {
444 error = cache_lookup(dvp, ap->a_vpp, cnp);
445
446 if (error >= 0)
447 return error;
448 }
449
450 if (isdot) {
451 vp = ap->a_dvp;
452 vref(vp);
453 *ap->a_vpp = vp;
454 return 0;
455 }
456
457 puffs_makecn(&lookup_arg.pvnr_cn, &lookup_arg.pvnr_cn_cred,
458 &lookup_arg.pvnr_cn_cid, cnp);
459
460 if (cnp->cn_flags & ISDOTDOT)
461 VOP_UNLOCK(dvp, 0);
462
463 error = puffs_vntouser(pmp, PUFFS_VN_LOOKUP,
464 &lookup_arg, sizeof(lookup_arg), 0, dvp, NULL);
465 DPRINTF(("puffs_lookup: return of the userspace, part %d\n", error));
466
467 /*
468 * In case of error, there is no new vnode to play with, so be
469 * happy with the NULL value given to vpp in the beginning.
470 * Also, check if this really was an error or the target was not
471 * present. Either treat it as a non-error for CREATE/RENAME or
472 * enter the component into the negative name cache (if desired).
473 */
474 if (error) {
475 if (error == ENOENT) {
476 if ((cnp->cn_flags & ISLASTCN)
477 && (cnp->cn_nameiop == CREATE
478 || cnp->cn_nameiop == RENAME)) {
479 cnp->cn_flags |= SAVENAME;
480 error = EJUSTRETURN;
481 } else {
482 if ((cnp->cn_flags & MAKEENTRY)
483 && PUFFS_USE_NAMECACHE(pmp))
484 cache_enter(dvp, NULL, cnp);
485 }
486 } else if (error < 0) {
487 error = EINVAL;
488 }
489 goto out;
490 }
491
492 /*
493 * Check that we don't get our parent node back, that would cause
494 * a pretty obvious deadlock.
495 */
496 dpn = dvp->v_data;
497 if (lookup_arg.pvnr_newnode == dpn->pn_cookie) {
498 error = EINVAL;
499 goto out;
500 }
501
502 /* XXX: race here */
503 /* XXX2: this check for node existence twice */
504 error = puffs_pnode2vnode(pmp, lookup_arg.pvnr_newnode, 1, &vp);
505 if (error) {
506 error = puffs_getvnode(dvp->v_mount,
507 lookup_arg.pvnr_newnode, lookup_arg.pvnr_vtype,
508 lookup_arg.pvnr_size, lookup_arg.pvnr_rdev, &vp);
509 if (error) {
510 goto out;
511 }
512 vn_lock(vp, LK_EXCLUSIVE | LK_RETRY);
513 }
514 *ap->a_vpp = vp;
515
516 if ((cnp->cn_flags & MAKEENTRY) != 0 && PUFFS_USE_NAMECACHE(pmp))
517 cache_enter(dvp, vp, cnp);
518
519 out:
520 if (cnp->cn_flags & ISDOTDOT)
521 vn_lock(dvp, LK_EXCLUSIVE | LK_RETRY);
522
523 DPRINTF(("puffs_lookup: returning %d %p\n", error, *ap->a_vpp));
524 return error;
525 }
526
527 int
528 puffs_create(void *v)
529 {
530 struct vop_create_args /* {
531 const struct vnodeop_desc *a_desc;
532 struct vnode *a_dvp;
533 struct vnode **a_vpp;
534 struct componentname *a_cnp;
535 struct vattr *a_vap;
536 } */ *ap = v;
537 int error;
538
539 PUFFS_VNREQ(create);
540 DPRINTF(("puffs_create: dvp %p, cnp: %s\n",
541 ap->a_dvp, ap->a_cnp->cn_nameptr));
542
543 puffs_makecn(&create_arg.pvnr_cn, &create_arg.pvnr_cn_cred,
544 &create_arg.pvnr_cn_cid, ap->a_cnp);
545 create_arg.pvnr_va = *ap->a_vap;
546
547 error = puffs_vntouser(MPTOPUFFSMP(ap->a_dvp->v_mount), PUFFS_VN_CREATE,
548 &create_arg, sizeof(create_arg), 0, ap->a_dvp, NULL);
549 if (error)
550 goto out;
551
552 error = puffs_newnode(ap->a_dvp->v_mount, ap->a_dvp, ap->a_vpp,
553 create_arg.pvnr_newnode, ap->a_cnp, ap->a_vap->va_type, 0);
554 /* XXX: in case of error, need to uncommit userspace transaction */
555
556 out:
557 if (error || (ap->a_cnp->cn_flags & SAVESTART) == 0)
558 PNBUF_PUT(ap->a_cnp->cn_pnbuf);
559 vput(ap->a_dvp);
560
561 DPRINTF(("puffs_create: return %d\n", error));
562 return error;
563 }
564
565 int
566 puffs_mknod(void *v)
567 {
568 struct vop_mknod_args /* {
569 const struct vnodeop_desc *a_desc;
570 struct vnode *a_dvp;
571 struct vnode **a_vpp;
572 struct componentname *a_cnp;
573 struct vattr *a_vap;
574 } */ *ap = v;
575 int error;
576
577 PUFFS_VNREQ(mknod);
578
579 puffs_makecn(&mknod_arg.pvnr_cn, &mknod_arg.pvnr_cn_cred,
580 &mknod_arg.pvnr_cn_cid, ap->a_cnp);
581 mknod_arg.pvnr_va = *ap->a_vap;
582
583 error = puffs_vntouser(MPTOPUFFSMP(ap->a_dvp->v_mount), PUFFS_VN_MKNOD,
584 &mknod_arg, sizeof(mknod_arg), 0, ap->a_dvp, NULL);
585 if (error)
586 goto out;
587
588 error = puffs_newnode(ap->a_dvp->v_mount, ap->a_dvp, ap->a_vpp,
589 mknod_arg.pvnr_newnode, ap->a_cnp, ap->a_vap->va_type,
590 ap->a_vap->va_rdev);
591
592 out:
593 if (error || (ap->a_cnp->cn_flags & SAVESTART) == 0)
594 PNBUF_PUT(ap->a_cnp->cn_pnbuf);
595 vput(ap->a_dvp);
596 return error;
597 }
598
599 int
600 puffs_open(void *v)
601 {
602 struct vop_open_args /* {
603 const struct vnodeop_desc *a_desc;
604 struct vnode *a_vp;
605 int a_mode;
606 kauth_cred_t a_cred;
607 struct lwp *a_l;
608 } */ *ap = v;
609 struct vnode *vp = ap->a_vp;
610 struct puffs_mount *pmp = MPTOPUFFSMP(vp->v_mount);
611 int mode = ap->a_mode;
612 int error;
613
614 PUFFS_VNREQ(open);
615 DPRINTF(("puffs_open: vp %p, mode 0x%x\n", vp, mode));
616
617 if (vp->v_type == VREG && mode & FWRITE && !EXISTSOP(pmp, WRITE))
618 ERROUT(EROFS);
619
620 if (!EXISTSOP(pmp, OPEN))
621 ERROUT(0);
622
623 open_arg.pvnr_mode = mode;
624 puffs_credcvt(&open_arg.pvnr_cred, ap->a_cred);
625 puffs_cidcvt(&open_arg.pvnr_cid, ap->a_l);
626
627 error = puffs_vntouser(MPTOPUFFSMP(vp->v_mount), PUFFS_VN_OPEN,
628 &open_arg, sizeof(open_arg), 0, vp, NULL);
629
630 out:
631 DPRINTF(("puffs_open: returning %d\n", error));
632 return error;
633 }
634
635 int
636 puffs_close(void *v)
637 {
638 struct vop_close_args /* {
639 const struct vnodeop_desc *a_desc;
640 struct vnode *a_vp;
641 int a_fflag;
642 kauth_cred_t a_cred;
643 struct lwp *a_l;
644 } */ *ap = v;
645 struct puffs_vnreq_close *close_argp;
646
647 close_argp = malloc(sizeof(struct puffs_vnreq_close),
648 M_PUFFS, M_WAITOK | M_ZERO);
649 close_argp->pvnr_fflag = ap->a_fflag;
650 puffs_credcvt(&close_argp->pvnr_cred, ap->a_cred);
651 puffs_cidcvt(&close_argp->pvnr_cid, ap->a_l);
652
653 puffs_vntouser_faf(MPTOPUFFSMP(ap->a_vp->v_mount), PUFFS_VN_CLOSE,
654 close_argp, sizeof(struct puffs_vnreq_close), ap->a_vp);
655
656 return 0;
657 }
658
659 int
660 puffs_access(void *v)
661 {
662 struct vop_access_args /* {
663 const struct vnodeop_desc *a_desc;
664 struct vnode *a_vp;
665 int a_mode;
666 kauth_cred_t a_cred;
667 struct lwp *a_l;
668 } */ *ap = v;
669 struct vnode *vp = ap->a_vp;
670 struct puffs_mount *pmp = MPTOPUFFSMP(vp->v_mount);
671 int mode = ap->a_mode;
672
673 PUFFS_VNREQ(access);
674
675 if (vp->v_type == VREG && mode & VWRITE && !EXISTSOP(pmp, WRITE))
676 return EROFS;
677
678 if (!EXISTSOP(pmp, ACCESS))
679 return 0;
680
681 access_arg.pvnr_mode = ap->a_mode;
682 puffs_credcvt(&access_arg.pvnr_cred, ap->a_cred);
683 puffs_cidcvt(&access_arg.pvnr_cid, ap->a_l);
684
685 return puffs_vntouser(MPTOPUFFSMP(vp->v_mount), PUFFS_VN_ACCESS,
686 &access_arg, sizeof(access_arg), 0, vp, NULL);
687 }
688
689 int
690 puffs_getattr(void *v)
691 {
692 struct vop_getattr_args /* {
693 const struct vnodeop_desc *a_desc;
694 struct vnode *a_vp;
695 struct vattr *a_vap;
696 kauth_cred_t a_cred;
697 struct lwp *a_l;
698 } */ *ap = v;
699 struct mount *mp;
700 struct vnode *vp;
701 struct vattr *vap, *rvap;
702 struct puffs_node *pn;
703 int error;
704
705 PUFFS_VNREQ(getattr);
706
707 vp = ap->a_vp;
708 mp = vp->v_mount;
709 vap = ap->a_vap;
710
711 vattr_null(&getattr_arg.pvnr_va);
712 puffs_credcvt(&getattr_arg.pvnr_cred, ap->a_cred);
713 puffs_cidcvt(&getattr_arg.pvnr_cid, ap->a_l);
714
715 error = puffs_vntouser(MPTOPUFFSMP(vp->v_mount), PUFFS_VN_GETATTR,
716 &getattr_arg, sizeof(getattr_arg), 0, vp, NULL);
717 if (error)
718 return error;
719
720 rvap = &getattr_arg.pvnr_va;
721 /*
722 * Don't listen to the file server regarding special device
723 * size info, the file server doesn't know anything about them.
724 */
725 if (vp->v_type == VBLK || vp->v_type == VCHR)
726 rvap->va_size = vp->v_size;
727
728 /* Ditto for blocksize (ufs comment: this doesn't belong here) */
729 if (vp->v_type == VBLK)
730 rvap->va_blocksize = BLKDEV_IOSIZE;
731 else if (vp->v_type == VCHR)
732 rvap->va_blocksize = MAXBSIZE;
733
734 (void) memcpy(vap, rvap, sizeof(struct vattr));
735 vap->va_fsid = mp->mnt_stat.f_fsidx.__fsid_val[0];
736
737 pn = VPTOPP(vp);
738 if (pn->pn_stat & PNODE_METACACHE_ATIME)
739 vap->va_atime = pn->pn_mc_atime;
740 if (pn->pn_stat & PNODE_METACACHE_CTIME)
741 vap->va_ctime = pn->pn_mc_ctime;
742 if (pn->pn_stat & PNODE_METACACHE_MTIME)
743 vap->va_mtime = pn->pn_mc_mtime;
744 if (pn->pn_stat & PNODE_METACACHE_SIZE) {
745 vap->va_size = pn->pn_mc_size;
746 } else {
747 if (rvap->va_size != VNOVAL
748 && vp->v_type != VBLK && vp->v_type != VCHR)
749 uvm_vnp_setsize(vp, rvap->va_size);
750 }
751
752 return 0;
753 }
754
755 int
756 puffs_setattr(void *v)
757 {
758 struct vop_getattr_args /* {
759 const struct vnodeop_desc *a_desc;
760 struct vnode *a_vp;
761 struct vattr *a_vap;
762 kauth_cred_t a_cred;
763 struct lwp *a_l;
764 } */ *ap = v;
765 int error;
766 struct vattr *vap = ap->a_vap;
767 struct puffs_node *pn = ap->a_vp->v_data;
768
769 PUFFS_VNREQ(setattr);
770
771 /*
772 * Flush metacache first. If we are called with some explicit
773 * parameters, treat them as information overriding metacache
774 * information.
775 */
776 if (pn->pn_stat & PNODE_METACACHE_MASK) {
777 if ((pn->pn_stat & PNODE_METACACHE_ATIME)
778 && vap->va_atime.tv_sec == VNOVAL)
779 vap->va_atime = pn->pn_mc_atime;
780 if ((pn->pn_stat & PNODE_METACACHE_CTIME)
781 && vap->va_ctime.tv_sec == VNOVAL)
782 vap->va_ctime = pn->pn_mc_ctime;
783 if ((pn->pn_stat & PNODE_METACACHE_MTIME)
784 && vap->va_mtime.tv_sec == VNOVAL)
785 vap->va_mtime = pn->pn_mc_mtime;
786 if ((pn->pn_stat & PNODE_METACACHE_SIZE)
787 && vap->va_size == VNOVAL)
788 vap->va_size = pn->pn_mc_size;
789
790 pn->pn_stat &= ~PNODE_METACACHE_MASK;
791 }
792
793 (void)memcpy(&setattr_arg.pvnr_va, vap, sizeof(struct vattr));
794 puffs_credcvt(&setattr_arg.pvnr_cred, ap->a_cred);
795 puffs_cidcvt(&setattr_arg.pvnr_cid, ap->a_l);
796
797 error = puffs_vntouser(MPTOPUFFSMP(ap->a_vp->v_mount), PUFFS_VN_SETATTR,
798 &setattr_arg, sizeof(setattr_arg), 0, ap->a_vp, NULL);
799 if (error)
800 return error;
801
802 if (vap->va_size != VNOVAL)
803 uvm_vnp_setsize(ap->a_vp, vap->va_size);
804
805 return 0;
806 }
807
808 int
809 puffs_inactive(void *v)
810 {
811 struct vop_inactive_args /* {
812 const struct vnodeop_desc *a_desc;
813 struct vnode *a_vp;
814 struct lwp *a_l;
815 } */ *ap = v;
816 struct puffs_mount *pmp;
817 struct puffs_node *pnode;
818 int rv, vnrefs, call;
819
820 PUFFS_VNREQ(inactive);
821
822 /*
823 * XXX: think about this after we really start unlocking
824 * when going to userspace
825 */
826 pnode = ap->a_vp->v_data;
827
828 pmp = MPTOPUFFSMP(ap->a_vp->v_mount);
829
830 puffs_cidcvt(&inactive_arg.pvnr_cid, ap->a_l);
831
832 if (EXISTSOP(pmp, INACTIVE))
833 if (pmp->pmp_flags & PUFFS_KFLAG_IAONDEMAND)
834 if ((pnode->pn_stat & PNODE_DOINACT) || ALLOPS(pmp))
835 call = 1;
836 else
837 call = 0;
838 else
839 call = 1;
840 else
841 call = 0;
842
843 if (call)
844 rv = puffs_vntouser(pmp, PUFFS_VN_INACTIVE,
845 &inactive_arg, sizeof(inactive_arg), 0, ap->a_vp, NULL);
846 else
847 rv = 1; /* see below */
848 pnode->pn_stat &= ~PNODE_DOINACT;
849
850 /* can't trust userspace return value? simulate safe answer */
851 if (rv)
852 vnrefs = 1;
853 else
854 vnrefs = inactive_arg.pvnr_backendrefs;
855
856 VOP_UNLOCK(ap->a_vp, 0);
857
858 /*
859 * user server thinks it's gone? then don't be afraid care,
860 * node's life was already all it would ever be
861 */
862 if (vnrefs == 0 || (pnode->pn_stat & PNODE_NOREFS)) {
863 pnode->pn_stat |= PNODE_DYING;
864 vrecycle(ap->a_vp, NULL, ap->a_l);
865 }
866
867 return 0;
868 }
869
870 /*
871 * always FAF, we don't really care if the server wants to fail to
872 * reclaim the node or not
873 */
874 int
875 puffs_reclaim(void *v)
876 {
877 struct vop_reclaim_args /* {
878 const struct vnodeop_desc *a_desc;
879 struct vnode *a_vp;
880 struct lwp *a_l;
881 } */ *ap = v;
882 struct puffs_mount *pmp;
883 struct puffs_vnreq_reclaim *reclaim_argp;
884
885 pmp = MPTOPUFFSMP(ap->a_vp->v_mount);
886
887 /*
888 * first things first: check if someone is trying to reclaim the
889 * root vnode. do not allow that to travel to userspace.
890 * Note that we don't need to take the lock similarly to
891 * puffs_root(), since there is only one of us.
892 */
893 if (ap->a_vp->v_flag & VROOT) {
894 mutex_enter(&pmp->pmp_lock);
895 KASSERT(pmp->pmp_root != NULL);
896 pmp->pmp_root = NULL;
897 mutex_exit(&pmp->pmp_lock);
898 goto out;
899 }
900
901 if (!EXISTSOP(pmp, RECLAIM))
902 goto out;
903
904 reclaim_argp = malloc(sizeof(struct puffs_vnreq_reclaim),
905 M_PUFFS, M_WAITOK | M_ZERO);
906 puffs_cidcvt(&reclaim_argp->pvnr_cid, ap->a_l);
907
908 puffs_vntouser_faf(pmp, PUFFS_VN_RECLAIM,
909 reclaim_argp, sizeof(struct puffs_vnreq_reclaim), ap->a_vp);
910
911 out:
912 if (PUFFS_USE_NAMECACHE(pmp))
913 cache_purge(ap->a_vp);
914 puffs_putvnode(ap->a_vp);
915
916 return 0;
917 }
918
919 #define CSIZE sizeof(**ap->a_cookies)
920 int
921 puffs_readdir(void *v)
922 {
923 struct vop_readdir_args /* {
924 const struct vnodeop_desc *a_desc;
925 struct vnode *a_vp;
926 struct uio *a_uio;
927 kauth_cred_t a_cred;
928 int *a_eofflag;
929 off_t **a_cookies;
930 int *a_ncookies;
931 } */ *ap = v;
932 struct puffs_mount *pmp = MPTOPUFFSMP(ap->a_vp->v_mount);
933 struct puffs_vnreq_readdir *readdir_argp;
934 size_t argsize, tomove, cookiemem, cookiesmax;
935 struct uio *uio = ap->a_uio;
936 size_t howmuch;
937 int error;
938
939 if (ap->a_cookies) {
940 KASSERT(ap->a_ncookies != NULL);
941 if (pmp->pmp_args.pa_fhsize == 0)
942 return EOPNOTSUPP;
943 cookiesmax = uio->uio_resid/_DIRENT_MINSIZE((struct dirent *)0);
944 cookiemem = ALIGN(cookiesmax*CSIZE); /* play safe */
945 } else {
946 cookiesmax = 0;
947 cookiemem = 0;
948 }
949
950 argsize = sizeof(struct puffs_vnreq_readdir);
951 tomove = uio->uio_resid + cookiemem;
952 readdir_argp = malloc(argsize + tomove, M_PUFFS, M_ZERO | M_WAITOK);
953
954 puffs_credcvt(&readdir_argp->pvnr_cred, ap->a_cred);
955 readdir_argp->pvnr_offset = uio->uio_offset;
956 readdir_argp->pvnr_resid = uio->uio_resid;
957 readdir_argp->pvnr_ncookies = cookiesmax;
958 readdir_argp->pvnr_eofflag = 0;
959 readdir_argp->pvnr_dentoff = cookiemem;
960
961 error = puffs_vntouser(MPTOPUFFSMP(ap->a_vp->v_mount),
962 PUFFS_VN_READDIR, readdir_argp, argsize, tomove,
963 ap->a_vp, NULL);
964 if (error)
965 goto out;
966
967 /* userspace is cheating? */
968 if (readdir_argp->pvnr_resid > uio->uio_resid
969 || readdir_argp->pvnr_ncookies > cookiesmax)
970 ERROUT(EINVAL);
971
972 /* check eof */
973 if (readdir_argp->pvnr_eofflag)
974 *ap->a_eofflag = 1;
975
976 /* bouncy-wouncy with the directory data */
977 howmuch = uio->uio_resid - readdir_argp->pvnr_resid;
978
979 /* force eof if no data was returned (getcwd() needs this) */
980 if (howmuch == 0) {
981 *ap->a_eofflag = 1;
982 goto out;
983 }
984
985 error = uiomove(readdir_argp->pvnr_data + cookiemem, howmuch, uio);
986 if (error)
987 goto out;
988
989 /* provide cookies to caller if so desired */
990 if (ap->a_cookies) {
991 *ap->a_cookies = malloc(readdir_argp->pvnr_ncookies*CSIZE,
992 M_TEMP, M_WAITOK);
993 *ap->a_ncookies = readdir_argp->pvnr_ncookies;
994 memcpy(*ap->a_cookies, readdir_argp->pvnr_data,
995 *ap->a_ncookies*CSIZE);
996 }
997
998 /* next readdir starts here */
999 uio->uio_offset = readdir_argp->pvnr_offset;
1000
1001 out:
1002 free(readdir_argp, M_PUFFS);
1003 return error;
1004 }
1005 #undef CSIZE
1006
1007 /*
1008 * poll works by consuming the bitmask in pn_revents. If there are
1009 * events available, poll returns immediately. If not, it issues a
1010 * poll to userspace, selrecords itself and returns with no available
1011 * events. When the file server returns, it executes puffs_parkdone_poll(),
1012 * where available events are added to the bitmask. selnotify() is
1013 * then also executed by that function causing us to enter here again
1014 * and hopefully find the missing bits (unless someone got them first,
1015 * in which case it starts all over again).
1016 */
1017 int
1018 puffs_poll(void *v)
1019 {
1020 struct vop_poll_args /* {
1021 const struct vnodeop_desc *a_desc;
1022 struct vnode *a_vp;
1023 int a_events;
1024 struct lwp *a_l;
1025 }*/ *ap = v;
1026 struct vnode *vp = ap->a_vp;
1027 struct puffs_mount *pmp = MPTOPUFFSMP(vp->v_mount);
1028 struct puffs_vnreq_poll *poll_argp;
1029 struct puffs_node *pn = vp->v_data;
1030 int events;
1031
1032 if (EXISTSOP(pmp, POLL)) {
1033 mutex_enter(&pn->pn_mtx);
1034 events = pn->pn_revents & ap->a_events;
1035 if (events & ap->a_events) {
1036 pn->pn_revents &= ~ap->a_events;
1037 mutex_exit(&pn->pn_mtx);
1038
1039 return events;
1040 } else {
1041 puffs_referencenode(pn);
1042 mutex_exit(&pn->pn_mtx);
1043
1044 /* freed in puffs_parkdone_poll */
1045 poll_argp = malloc(sizeof(struct puffs_vnreq_poll),
1046 M_PUFFS, M_ZERO | M_WAITOK);
1047
1048 poll_argp->pvnr_events = ap->a_events;
1049 puffs_cidcvt(&poll_argp->pvnr_cid, ap->a_l);
1050
1051 selrecord(ap->a_l, &pn->pn_sel);
1052 puffs_vntouser_call(pmp, PUFFS_VN_POLL,
1053 poll_argp, sizeof(struct puffs_vnreq_poll), 0,
1054 puffs_parkdone_poll, pn,
1055 vp, NULL);
1056
1057 return 0;
1058 }
1059 } else {
1060 return genfs_poll(v);
1061 }
1062 }
1063
1064 int
1065 puffs_fsync(void *v)
1066 {
1067 struct vop_fsync_args /* {
1068 const struct vnodeop_desc *a_desc;
1069 struct vnode *a_vp;
1070 kauth_cred_t a_cred;
1071 int a_flags;
1072 off_t a_offlo;
1073 off_t a_offhi;
1074 struct lwp *a_l;
1075 } */ *ap = v;
1076 struct vattr va;
1077 struct puffs_mount *pmp;
1078 struct puffs_vnreq_fsync *fsync_argp;
1079 struct vnode *vp;
1080 struct puffs_node *pn;
1081 int pflags, error, dofaf;
1082
1083 PUFFS_VNREQ(fsync);
1084
1085 vp = ap->a_vp;
1086 pn = VPTOPP(vp);
1087 pmp = MPTOPUFFSMP(vp->v_mount);
1088
1089 /* flush out information from our metacache, see vop_setattr */
1090 if (pn->pn_stat & PNODE_METACACHE_MASK
1091 && (pn->pn_stat & PNODE_DYING) == 0) {
1092 vattr_null(&va);
1093 error = VOP_SETATTR(vp, &va, FSCRED, NULL);
1094 if (error)
1095 return error;
1096 }
1097
1098 /*
1099 * flush pages to avoid being overly dirty
1100 */
1101 pflags = PGO_CLEANIT;
1102 if (ap->a_flags & FSYNC_WAIT)
1103 pflags |= PGO_SYNCIO;
1104 simple_lock(&vp->v_interlock);
1105 error = VOP_PUTPAGES(vp, trunc_page(ap->a_offlo),
1106 round_page(ap->a_offhi), pflags);
1107 if (error)
1108 return error;
1109
1110 /*
1111 * HELLO! We exit already here if the user server does not
1112 * support fsync OR if we should call fsync for a node which
1113 * has references neither in the kernel or the fs server.
1114 * Otherwise we continue to issue fsync() forward.
1115 */
1116 if (!EXISTSOP(pmp, FSYNC) || (pn->pn_stat & PNODE_DYING))
1117 return 0;
1118
1119 dofaf = (ap->a_flags & FSYNC_WAIT) == 0 || ap->a_flags == FSYNC_LAZY;
1120 /*
1121 * We abuse VXLOCK to mean "vnode is going to die", so we issue
1122 * only FAFs for those. Otherwise there's a danger of deadlock,
1123 * since the execution context here might be the user server
1124 * doing some operation on another fs, which in turn caused a
1125 * vnode to be reclaimed from the freelist for this fs.
1126 */
1127 if (dofaf == 0) {
1128 simple_lock(&vp->v_interlock);
1129 if (vp->v_flag & VXLOCK)
1130 dofaf = 1;
1131 simple_unlock(&vp->v_interlock);
1132 }
1133
1134 if (dofaf == 0) {
1135 fsync_argp = &fsync_arg;
1136 } else {
1137 fsync_argp = malloc(sizeof(struct puffs_vnreq_fsync),
1138 M_PUFFS, M_ZERO | M_NOWAIT);
1139 if (fsync_argp == NULL)
1140 return ENOMEM;
1141 }
1142
1143 puffs_credcvt(&fsync_argp->pvnr_cred, ap->a_cred);
1144 fsync_argp->pvnr_flags = ap->a_flags;
1145 fsync_argp->pvnr_offlo = ap->a_offlo;
1146 fsync_argp->pvnr_offhi = ap->a_offhi;
1147 puffs_cidcvt(&fsync_argp->pvnr_cid, ap->a_l);
1148
1149 /*
1150 * XXX: see comment at puffs_getattr about locking
1151 *
1152 * If we are not required to wait, do a FAF operation.
1153 * Otherwise block here.
1154 */
1155 if (dofaf == 0) {
1156 error = puffs_vntouser(MPTOPUFFSMP(vp->v_mount),
1157 PUFFS_VN_FSYNC, fsync_argp, sizeof(*fsync_argp), 0,
1158 vp, NULL);
1159 } else {
1160 /* FAF is always "succesful" */
1161 error = 0;
1162 puffs_vntouser_faf(MPTOPUFFSMP(vp->v_mount),
1163 PUFFS_VN_FSYNC, fsync_argp, sizeof(*fsync_argp), vp);
1164 }
1165
1166 return error;
1167 }
1168
1169 int
1170 puffs_seek(void *v)
1171 {
1172 struct vop_seek_args /* {
1173 const struct vnodeop_desc *a_desc;
1174 struct vnode *a_vp;
1175 off_t a_oldoff;
1176 off_t a_newoff;
1177 kauth_cred_t a_cred;
1178 } */ *ap = v;
1179
1180 PUFFS_VNREQ(seek);
1181
1182 seek_arg.pvnr_oldoff = ap->a_oldoff;
1183 seek_arg.pvnr_newoff = ap->a_newoff;
1184 puffs_credcvt(&seek_arg.pvnr_cred, ap->a_cred);
1185
1186 /*
1187 * XXX: seems like seek is called with an unlocked vp, but
1188 * it can't hurt to play safe
1189 */
1190 return puffs_vntouser(MPTOPUFFSMP(ap->a_vp->v_mount), PUFFS_VN_SEEK,
1191 &seek_arg, sizeof(seek_arg), 0, ap->a_vp, NULL);
1192 }
1193
1194 int
1195 puffs_remove(void *v)
1196 {
1197 struct vop_remove_args /* {
1198 const struct vnodeop_desc *a_desc;
1199 struct vnode *a_dvp;
1200 struct vnode *a_vp;
1201 struct componentname *a_cnp;
1202 } */ *ap = v;
1203 int error;
1204
1205 PUFFS_VNREQ(remove);
1206
1207 remove_arg.pvnr_cookie_targ = VPTOPNC(ap->a_vp);
1208 puffs_makecn(&remove_arg.pvnr_cn, &remove_arg.pvnr_cn_cred,
1209 &remove_arg.pvnr_cn_cid, ap->a_cnp);
1210
1211 error = puffs_vntouser(MPTOPUFFSMP(ap->a_vp->v_mount), PUFFS_VN_REMOVE,
1212 &remove_arg, sizeof(remove_arg), 0, ap->a_dvp, ap->a_vp);
1213
1214 vput(ap->a_vp);
1215 if (ap->a_dvp == ap->a_vp)
1216 vrele(ap->a_dvp);
1217 else
1218 vput(ap->a_dvp);
1219
1220 return error;
1221 }
1222
1223 int
1224 puffs_mkdir(void *v)
1225 {
1226 struct vop_mkdir_args /* {
1227 const struct vnodeop_desc *a_desc;
1228 struct vnode *a_dvp;
1229 struct vnode **a_vpp;
1230 struct componentname *a_cnp;
1231 struct vattr *a_vap;
1232 } */ *ap = v;
1233 int error;
1234
1235 PUFFS_VNREQ(mkdir);
1236
1237 puffs_makecn(&mkdir_arg.pvnr_cn, &mkdir_arg.pvnr_cn_cred,
1238 &mkdir_arg.pvnr_cn_cid, ap->a_cnp);
1239 mkdir_arg.pvnr_va = *ap->a_vap;
1240
1241 error = puffs_vntouser(MPTOPUFFSMP(ap->a_dvp->v_mount), PUFFS_VN_MKDIR,
1242 &mkdir_arg, sizeof(mkdir_arg), 0, ap->a_dvp, NULL);
1243 if (error)
1244 goto out;
1245
1246 error = puffs_newnode(ap->a_dvp->v_mount, ap->a_dvp, ap->a_vpp,
1247 mkdir_arg.pvnr_newnode, ap->a_cnp, VDIR, 0);
1248
1249 out:
1250 if (error || (ap->a_cnp->cn_flags & SAVESTART) == 0)
1251 PNBUF_PUT(ap->a_cnp->cn_pnbuf);
1252 vput(ap->a_dvp);
1253 return error;
1254 }
1255
1256 int
1257 puffs_rmdir(void *v)
1258 {
1259 struct vop_rmdir_args /* {
1260 const struct vnodeop_desc *a_desc;
1261 struct vnode *a_dvp;
1262 struct vnode *a_vp;
1263 struct componentname *a_cnp;
1264 } */ *ap = v;
1265 int error;
1266
1267 PUFFS_VNREQ(rmdir);
1268
1269 rmdir_arg.pvnr_cookie_targ = VPTOPNC(ap->a_vp);
1270 puffs_makecn(&rmdir_arg.pvnr_cn, &rmdir_arg.pvnr_cn_cred,
1271 &rmdir_arg.pvnr_cn_cid, ap->a_cnp);
1272
1273 error = puffs_vntouser(MPTOPUFFSMP(ap->a_dvp->v_mount), PUFFS_VN_RMDIR,
1274 &rmdir_arg, sizeof(rmdir_arg), 0, ap->a_dvp, ap->a_vp);
1275
1276 /* XXX: some call cache_purge() *for both vnodes* here, investigate */
1277
1278 vput(ap->a_dvp);
1279 vput(ap->a_vp);
1280
1281 return error;
1282 }
1283
1284 int
1285 puffs_link(void *v)
1286 {
1287 struct vop_link_args /* {
1288 const struct vnodeop_desc *a_desc;
1289 struct vnode *a_dvp;
1290 struct vnode *a_vp;
1291 struct componentname *a_cnp;
1292 }*/ *ap = v;
1293 int error;
1294
1295 PUFFS_VNREQ(link);
1296
1297 link_arg.pvnr_cookie_targ = VPTOPNC(ap->a_vp);
1298 puffs_makecn(&link_arg.pvnr_cn, &link_arg.pvnr_cn_cred,
1299 &link_arg.pvnr_cn_cid, ap->a_cnp);
1300
1301 error = puffs_vntouser(MPTOPUFFSMP(ap->a_dvp->v_mount), PUFFS_VN_LINK,
1302 &link_arg, sizeof(link_arg), 0, ap->a_dvp, ap->a_vp);
1303
1304 /*
1305 * XXX: stay in touch with the cache. I don't like this, but
1306 * don't have a better solution either. See also puffs_rename().
1307 */
1308 if (error == 0)
1309 puffs_updatenode(ap->a_vp, PUFFS_UPDATECTIME);
1310
1311 vput(ap->a_dvp);
1312
1313 return error;
1314 }
1315
1316 int
1317 puffs_symlink(void *v)
1318 {
1319 struct vop_symlink_args /* {
1320 const struct vnodeop_desc *a_desc;
1321 struct vnode *a_dvp;
1322 struct vnode **a_vpp;
1323 struct componentname *a_cnp;
1324 struct vattr *a_vap;
1325 char *a_target;
1326 }*/ *ap = v;
1327 struct puffs_vnreq_symlink *symlink_argp;
1328 int error;
1329
1330 *ap->a_vpp = NULL;
1331
1332 symlink_argp = malloc(sizeof(struct puffs_vnreq_symlink),
1333 M_PUFFS, M_ZERO | M_WAITOK);
1334 puffs_makecn(&symlink_argp->pvnr_cn, &symlink_argp->pvnr_cn_cred,
1335 &symlink_argp->pvnr_cn_cid, ap->a_cnp);
1336 symlink_argp->pvnr_va = *ap->a_vap;
1337 (void)strlcpy(symlink_argp->pvnr_link, ap->a_target,
1338 sizeof(symlink_argp->pvnr_link));
1339
1340 error = puffs_vntouser(MPTOPUFFSMP(ap->a_dvp->v_mount),
1341 PUFFS_VN_SYMLINK, symlink_argp, sizeof(*symlink_argp), 0,
1342 ap->a_dvp, NULL);
1343 if (error)
1344 goto out;
1345
1346 error = puffs_newnode(ap->a_dvp->v_mount, ap->a_dvp, ap->a_vpp,
1347 symlink_argp->pvnr_newnode, ap->a_cnp, VLNK, 0);
1348
1349 out:
1350 free(symlink_argp, M_PUFFS);
1351 if (error || (ap->a_cnp->cn_flags & SAVESTART) == 0)
1352 PNBUF_PUT(ap->a_cnp->cn_pnbuf);
1353 vput(ap->a_dvp);
1354
1355 return error;
1356 }
1357
1358 int
1359 puffs_readlink(void *v)
1360 {
1361 struct vop_readlink_args /* {
1362 const struct vnodeop_desc *a_desc;
1363 struct vnode *a_vp;
1364 struct uio *a_uio;
1365 kauth_cred_t a_cred;
1366 } */ *ap = v;
1367 size_t linklen;
1368 int error;
1369
1370 PUFFS_VNREQ(readlink);
1371
1372 puffs_credcvt(&readlink_arg.pvnr_cred, ap->a_cred);
1373 linklen = sizeof(readlink_arg.pvnr_link);
1374 readlink_arg.pvnr_linklen = linklen;
1375
1376 error = puffs_vntouser(MPTOPUFFSMP(ap->a_vp->v_mount),
1377 PUFFS_VN_READLINK, &readlink_arg, sizeof(readlink_arg), 0,
1378 ap->a_vp, NULL);
1379 if (error)
1380 return error;
1381
1382 /* bad bad user file server */
1383 if (readlink_arg.pvnr_linklen > linklen)
1384 return EINVAL;
1385
1386 return uiomove(&readlink_arg.pvnr_link, readlink_arg.pvnr_linklen,
1387 ap->a_uio);
1388 }
1389
1390 int
1391 puffs_rename(void *v)
1392 {
1393 struct vop_rename_args /* {
1394 const struct vnodeop_desc *a_desc;
1395 struct vnode *a_fdvp;
1396 struct vnode *a_fvp;
1397 struct componentname *a_fcnp;
1398 struct vnode *a_tdvp;
1399 struct vnode *a_tvp;
1400 struct componentname *a_tcnp;
1401 }*/ *ap = v;
1402 struct puffs_vnreq_rename *rename_argp = NULL;
1403 int error;
1404
1405 if (ap->a_fvp->v_mount != ap->a_tdvp->v_mount)
1406 ERROUT(EXDEV);
1407
1408 rename_argp = malloc(sizeof(struct puffs_vnreq_rename),
1409 M_PUFFS, M_WAITOK | M_ZERO);
1410
1411 rename_argp->pvnr_cookie_src = VPTOPNC(ap->a_fvp);
1412 rename_argp->pvnr_cookie_targdir = VPTOPNC(ap->a_tdvp);
1413 if (ap->a_tvp)
1414 rename_argp->pvnr_cookie_targ = VPTOPNC(ap->a_tvp);
1415 else
1416 rename_argp->pvnr_cookie_targ = NULL;
1417 puffs_makecn(&rename_argp->pvnr_cn_src,
1418 &rename_argp->pvnr_cn_src_cred, &rename_argp->pvnr_cn_src_cid,
1419 ap->a_fcnp);
1420 puffs_makecn(&rename_argp->pvnr_cn_targ,
1421 &rename_argp->pvnr_cn_targ_cred, &rename_argp->pvnr_cn_targ_cid,
1422 ap->a_tcnp);
1423
1424 error = puffs_vntouser(MPTOPUFFSMP(ap->a_fdvp->v_mount),
1425 PUFFS_VN_RENAME, rename_argp, sizeof(*rename_argp), 0,
1426 ap->a_fdvp, NULL); /* XXX */
1427
1428 /*
1429 * XXX: stay in touch with the cache. I don't like this, but
1430 * don't have a better solution either. See also puffs_link().
1431 */
1432 if (error == 0)
1433 puffs_updatenode(ap->a_fvp, PUFFS_UPDATECTIME);
1434
1435 out:
1436 if (rename_argp)
1437 free(rename_argp, M_PUFFS);
1438 if (ap->a_tvp != NULL)
1439 vput(ap->a_tvp);
1440 if (ap->a_tdvp == ap->a_tvp)
1441 vrele(ap->a_tdvp);
1442 else
1443 vput(ap->a_tdvp);
1444
1445 vrele(ap->a_fdvp);
1446 vrele(ap->a_fvp);
1447
1448 return error;
1449 }
1450
/*
 * Fill in the common fields of a read/write request: I/O flags,
 * number of bytes to move, file offset and credentials.
 *
 * Wrapped in do { } while (0) so that the macro expands to exactly
 * one statement and stays correct under an unbraced if/else.
 */
#define RWARGS(cont, iofl, move, offset, creds)				\
do {									\
	(cont)->pvnr_ioflag = (iofl);					\
	(cont)->pvnr_resid = (move);					\
	(cont)->pvnr_offset = (offset);					\
	puffs_credcvt(&(cont)->pvnr_cred, creds);			\
} while (/*CONSTCOND*/0)
1456
1457 int
1458 puffs_read(void *v)
1459 {
1460 struct vop_read_args /* {
1461 const struct vnodeop_desc *a_desc;
1462 struct vnode *a_vp;
1463 struct uio *a_uio;
1464 int a_ioflag;
1465 kauth_cred_t a_cred;
1466 } */ *ap = v;
1467 struct puffs_vnreq_read *read_argp;
1468 struct puffs_mount *pmp;
1469 struct vnode *vp;
1470 struct uio *uio;
1471 void *win;
1472 size_t tomove, argsize;
1473 vsize_t bytelen;
1474 int error, ubcflags;
1475
1476 uio = ap->a_uio;
1477 vp = ap->a_vp;
1478 read_argp = NULL;
1479 error = 0;
1480 pmp = MPTOPUFFSMP(vp->v_mount);
1481
1482 /* std sanity */
1483 if (uio->uio_resid == 0)
1484 return 0;
1485 if (uio->uio_offset < 0)
1486 return EINVAL;
1487
1488 if (vp->v_type == VREG && PUFFS_USE_PAGECACHE(pmp)) {
1489 const int advice = IO_ADV_DECODE(ap->a_ioflag);
1490
1491 ubcflags = 0;
1492 if (UBC_WANT_UNMAP(vp))
1493 ubcflags = UBC_UNMAP;
1494
1495 while (uio->uio_resid > 0) {
1496 bytelen = MIN(uio->uio_resid,
1497 vp->v_size - uio->uio_offset);
1498 if (bytelen == 0)
1499 break;
1500
1501 win = ubc_alloc(&vp->v_uobj, uio->uio_offset,
1502 &bytelen, advice, UBC_READ);
1503 error = uiomove(win, bytelen, uio);
1504 ubc_release(win, ubcflags);
1505 if (error)
1506 break;
1507 }
1508
1509 if ((vp->v_mount->mnt_flag & MNT_NOATIME) == 0)
1510 puffs_updatenode(vp, PUFFS_UPDATEATIME);
1511 } else {
1512 /*
1513 * in case it's not a regular file or we're operating
1514 * uncached, do read in the old-fashioned style,
1515 * i.e. explicit read operations
1516 */
1517
1518 tomove = PUFFS_TOMOVE(uio->uio_resid, pmp);
1519 argsize = sizeof(struct puffs_vnreq_read);
1520 read_argp = malloc(argsize + tomove,
1521 M_PUFFS, M_WAITOK | M_ZERO);
1522
1523 error = 0;
1524 while (uio->uio_resid > 0) {
1525 tomove = PUFFS_TOMOVE(uio->uio_resid, pmp);
1526 RWARGS(read_argp, ap->a_ioflag, tomove,
1527 uio->uio_offset, ap->a_cred);
1528
1529 error = puffs_vntouser(pmp, PUFFS_VN_READ,
1530 read_argp, argsize, tomove,
1531 ap->a_vp, NULL);
1532 if (error)
1533 break;
1534
1535 if (read_argp->pvnr_resid > tomove) {
1536 error = EINVAL;
1537 break;
1538 }
1539
1540 error = uiomove(read_argp->pvnr_data,
1541 tomove - read_argp->pvnr_resid, uio);
1542
1543 /*
1544 * in case the file is out of juice, resid from
1545 * userspace is != 0. and the error-case is
1546 * quite obvious
1547 */
1548 if (error || read_argp->pvnr_resid)
1549 break;
1550 }
1551 }
1552
1553 if (read_argp)
1554 free(read_argp, M_PUFFS);
1555 return error;
1556 }
1557
1558 /*
1559 * XXX: in case of a failure, this leaves uio in a bad state.
1560 * We could theoretically copy the uio and iovecs and "replay"
1561 * them the right amount after the userspace trip, but don't
1562 * bother for now.
1563 */
1564 int
1565 puffs_write(void *v)
1566 {
1567 struct vop_write_args /* {
1568 const struct vnodeop_desc *a_desc;
1569 struct vnode *a_vp;
1570 struct uio *a_uio;
1571 int a_ioflag;
1572 kauth_cred_t a_cred;
1573 } */ *ap = v;
1574 struct puffs_vnreq_write *write_argp;
1575 struct puffs_mount *pmp;
1576 struct uio *uio;
1577 struct vnode *vp;
1578 size_t tomove, argsize;
1579 off_t oldoff, newoff, origoff;
1580 vsize_t bytelen;
1581 int error, uflags;
1582 int ubcflags;
1583
1584 vp = ap->a_vp;
1585 uio = ap->a_uio;
1586 error = uflags = 0;
1587 write_argp = NULL;
1588 pmp = MPTOPUFFSMP(ap->a_vp->v_mount);
1589
1590 if (vp->v_type == VREG && PUFFS_USE_PAGECACHE(pmp)) {
1591 ubcflags = UBC_WRITE | UBC_PARTIALOK;
1592 if (UBC_WANT_UNMAP(vp))
1593 ubcflags = UBC_UNMAP;
1594
1595 /*
1596 * userspace *should* be allowed to control this,
1597 * but with UBC it's a bit unclear how to handle it
1598 */
1599 if (ap->a_ioflag & IO_APPEND)
1600 uio->uio_offset = vp->v_size;
1601
1602 origoff = uio->uio_offset;
1603 while (uio->uio_resid > 0) {
1604 uflags |= PUFFS_UPDATECTIME;
1605 uflags |= PUFFS_UPDATEMTIME;
1606 oldoff = uio->uio_offset;
1607 bytelen = uio->uio_resid;
1608
1609 newoff = oldoff + bytelen;
1610 if (vp->v_size < newoff) {
1611 uvm_vnp_setwritesize(vp, newoff);
1612 }
1613 error = ubc_uiomove(&vp->v_uobj, uio, bytelen,
1614 ubcflags);
1615
1616 /*
1617 * In case of a ubc_uiomove() error,
1618 * opt to not extend the file at all and
1619 * return an error. Otherwise, if we attempt
1620 * to clear the memory we couldn't fault to,
1621 * we might generate a kernel page fault.
1622 */
1623 if (vp->v_size < newoff) {
1624 if (error == 0) {
1625 uflags |= PUFFS_UPDATESIZE;
1626 uvm_vnp_setsize(vp, newoff);
1627 } else {
1628 uvm_vnp_setwritesize(vp, vp->v_size);
1629 }
1630 }
1631 if (error)
1632 break;
1633
1634 /*
1635 * If we're writing large files, flush to file server
1636 * every 64k. Otherwise we can very easily exhaust
1637 * kernel and user memory, as the file server cannot
1638 * really keep up with our writing speed.
1639 *
1640 * Note: this does *NOT* honor MNT_ASYNC, because
1641 * that gives userland too much say in the kernel.
1642 */
1643 if (oldoff >> 16 != uio->uio_offset >> 16) {
1644 simple_lock(&vp->v_interlock);
1645 error = VOP_PUTPAGES(vp, oldoff & ~0xffff,
1646 uio->uio_offset & ~0xffff,
1647 PGO_CLEANIT | PGO_SYNCIO);
1648 if (error)
1649 break;
1650 }
1651 }
1652
1653 /* synchronous I/O? */
1654 if (error == 0 && ap->a_ioflag & IO_SYNC) {
1655 simple_lock(&vp->v_interlock);
1656 error = VOP_PUTPAGES(vp, trunc_page(origoff),
1657 round_page(uio->uio_offset),
1658 PGO_CLEANIT | PGO_SYNCIO);
1659
1660 /* write though page cache? */
1661 } else if (error == 0 && pmp->pmp_flags & PUFFS_KFLAG_WTCACHE) {
1662 simple_lock(&vp->v_interlock);
1663 error = VOP_PUTPAGES(vp, trunc_page(origoff),
1664 round_page(uio->uio_offset), PGO_CLEANIT);
1665 }
1666
1667 puffs_updatenode(vp, uflags);
1668 } else {
1669 /* tomove is non-increasing */
1670 tomove = PUFFS_TOMOVE(uio->uio_resid, pmp);
1671 argsize = sizeof(struct puffs_vnreq_write) + tomove;
1672 write_argp = malloc(argsize, M_PUFFS, M_WAITOK | M_ZERO);
1673
1674 while (uio->uio_resid > 0) {
1675 /* move data to buffer */
1676 tomove = PUFFS_TOMOVE(uio->uio_resid, pmp);
1677 RWARGS(write_argp, ap->a_ioflag, tomove,
1678 uio->uio_offset, ap->a_cred);
1679 error = uiomove(write_argp->pvnr_data, tomove, uio);
1680 if (error)
1681 break;
1682
1683 /* move buffer to userspace */
1684 error = puffs_vntouser(MPTOPUFFSMP(ap->a_vp->v_mount),
1685 PUFFS_VN_WRITE, write_argp, argsize, 0,
1686 ap->a_vp, NULL);
1687 if (error)
1688 break;
1689
1690 if (write_argp->pvnr_resid > tomove) {
1691 error = EINVAL;
1692 break;
1693 }
1694
1695 /* adjust file size */
1696 if (vp->v_size < uio->uio_offset)
1697 uvm_vnp_setsize(vp, uio->uio_offset);
1698
1699 /* didn't move everything? bad userspace. bail */
1700 if (write_argp->pvnr_resid != 0) {
1701 error = EIO;
1702 break;
1703 }
1704 }
1705 }
1706
1707 if (write_argp)
1708 free(write_argp, M_PUFFS);
1709 return error;
1710 }
1711
1712 static int puffs_fcnioctl(struct vop_ioctl_args * /*XXX*/, int);
1713
1714 #define FCNIOCTL_ARG_MAX 1<<16
1715 int
1716 puffs_fcnioctl(struct vop_ioctl_args *ap, int puffsop)
1717 {
1718
1719 /* currently not supported */
1720 return EOPNOTSUPP;
1721 #if 0
1722 /* struct vop_ioctl_args {
1723 const struct vnodeop_desc *a_desc;
1724 struct vnode *a_vp;
1725 u_long a_command;
1726 void *a_data;
1727 int a_fflag;
1728 kauth_cred_t a_cred;
1729 struct lwp *a_l;
1730 }*ap = v; */
1731 struct puffs_mount *pmp;
1732 struct puffs_sizepark pspark;
1733 void *kernbuf;
1734 size_t copylen;
1735 int error;
1736
1737 PUFFS_VNREQ(fcnioctl);
1738
1739 /*
1740 * Since this op gives the filesystem (almost) complete control on
1741 * how much it is allowed to copy from the calling process
1742 * address space, do not enable it by default, since it would
1743 * be a whopping security hole.
1744 */
1745 pmp = MPTOPUFFSMP(ap->a_vp->v_mount);
1746 if ((pmp->pmp_flags & PUFFS_KFLAG_ALLOWCTL) == 0)
1747 return EINVAL; /* only shoe that fits */
1748
1749 /* fill in sizereq and store it */
1750 pspark.pkso_reqid = puffs_getreqid(pmp);
1751 pspark.pkso_reqtype = PUFFS_SIZEOPREQ_BUF_IN;
1752 pspark.pkso_copybuf = ap->a_data;
1753 pspark.pkso_bufsize = FCNIOCTL_ARG_MAX;
1754 TAILQ_INSERT_TAIL(&pmp->pmp_req_sizepark, &pspark, pkso_entries);
1755
1756 /* then fill in actual request and shoot it off */
1757 fcnioctl_arg.pvnr_command = ap->a_command;
1758 fcnioctl_arg.pvnr_fflag = ap->a_fflag;
1759 puffs_credcvt(&fcnioctl_arg.pvnr_cred, ap->a_cred);
1760 fcnioctl_arg.pvnr_pid = puffs_lwp2pid(ap->a_l);
1761
1762 error = puffs_vntouser_req(MPTOPUFFSMP(ap->a_vp->v_mount), puffsop,
1763 &fcnioctl_arg, sizeof(fcnioctl_arg), 0, ap->a_vp,
1764 pspark.pkso_reqid, ap->a_vp, NULL);
1765
1766 /* if we don't need to copy data, we're done */
1767 if (error || !fcnioctl_arg.pvnr_copyback)
1768 return error;
1769
1770 copylen = MIN(FCNIOCTL_ARG_MAX, fcnioctl_arg.pvnr_datalen);
1771 kernbuf = malloc(copylen, M_PUFFS, M_WAITOK);
1772 error = copyin(fcnioctl_arg.pvnr_data, kernbuf, copylen);
1773 if (error)
1774 goto out;
1775 error = copyout(kernbuf, ap->a_data, copylen);
1776
1777 out:
1778 free(kernbuf, M_PUFFS);
1779 return error;
1780 #endif
1781 }
1782
1783 int
1784 puffs_ioctl(void *v)
1785 {
1786
1787 return puffs_fcnioctl(v, PUFFS_VN_IOCTL);
1788 }
1789
1790 int
1791 puffs_fcntl(void *v)
1792 {
1793
1794 return puffs_fcnioctl(v, PUFFS_VN_FCNTL);
1795 }
1796
1797 int
1798 puffs_print(void *v)
1799 {
1800 struct vop_print_args /* {
1801 struct vnode *a_vp;
1802 } */ *ap = v;
1803 struct puffs_mount *pmp;
1804 struct vnode *vp = ap->a_vp;
1805 struct puffs_node *pn = vp->v_data;
1806
1807 PUFFS_VNREQ(print);
1808
1809 pmp = MPTOPUFFSMP(vp->v_mount);
1810
1811 /* kernel portion */
1812 printf("tag VT_PUFFS, vnode %p, puffs node: %p,\n"
1813 " userspace cookie: %p\n", vp, pn, pn->pn_cookie);
1814 if (vp->v_type == VFIFO)
1815 fifo_printinfo(vp);
1816 lockmgr_printinfo(&vp->v_lock);
1817
1818 /* userspace portion */
1819 if (EXISTSOP(pmp, PRINT))
1820 puffs_vntouser(pmp, PUFFS_VN_PRINT,
1821 &print_arg, sizeof(print_arg), 0, ap->a_vp, NULL);
1822
1823 return 0;
1824 }
1825
1826 int
1827 puffs_pathconf(void *v)
1828 {
1829 struct vop_pathconf_args /* {
1830 const struct vnodeop_desc *a_desc;
1831 struct vnode *a_vp;
1832 int a_name;
1833 register_t *a_retval;
1834 } */ *ap = v;
1835 int error;
1836
1837 PUFFS_VNREQ(pathconf);
1838
1839 pathconf_arg.pvnr_name = ap->a_name;
1840
1841 error = puffs_vntouser(MPTOPUFFSMP(ap->a_vp->v_mount),
1842 PUFFS_VN_PATHCONF, &pathconf_arg, sizeof(pathconf_arg), 0,
1843 ap->a_vp, NULL);
1844 if (error)
1845 return error;
1846
1847 *ap->a_retval = pathconf_arg.pvnr_retval;
1848
1849 return 0;
1850 }
1851
1852 int
1853 puffs_advlock(void *v)
1854 {
1855 struct vop_advlock_args /* {
1856 const struct vnodeop_desc *a_desc;
1857 struct vnode *a_vp;
1858 void *a_id;
1859 int a_op;
1860 struct flock *a_fl;
1861 int a_flags;
1862 } */ *ap = v;
1863 int error;
1864
1865 PUFFS_VNREQ(advlock);
1866
1867 error = copyin(ap->a_fl, &advlock_arg.pvnr_fl, sizeof(struct flock));
1868 if (error)
1869 return error;
1870 advlock_arg.pvnr_id = ap->a_id;
1871 advlock_arg.pvnr_op = ap->a_op;
1872 advlock_arg.pvnr_flags = ap->a_flags;
1873
1874 return puffs_vntouser(MPTOPUFFSMP(ap->a_vp->v_mount), PUFFS_VN_ADVLOCK,
1875 &advlock_arg, sizeof(advlock_arg), 0, ap->a_vp, NULL);
1876 }
1877
1878 #define BIOASYNC(bp) (bp->b_flags & B_ASYNC)
1879 #define BIOREAD(bp) (bp->b_flags & B_READ)
1880 #define BIOWRITE(bp) ((bp->b_flags & B_READ) == 0)
1881
1882 /*
1883 * This maps itself to PUFFS_VN_READ/WRITE for data transfer.
1884 */
1885 int
1886 puffs_strategy(void *v)
1887 {
1888 struct vop_strategy_args /* {
1889 const struct vnodeop_desc *a_desc;
1890 struct vnode *a_vp;
1891 struct buf *a_bp;
1892 } */ *ap = v;
1893 struct puffs_mount *pmp;
1894 struct vnode *vp = ap->a_vp;
1895 struct puffs_node *pn;
1896 struct puffs_vnreq_readwrite *rw_argp = NULL;
1897 struct buf *bp;
1898 size_t argsize;
1899 size_t tomove, moved;
1900 int error, dofaf;
1901
1902 pmp = MPTOPUFFSMP(vp->v_mount);
1903 bp = ap->a_bp;
1904 error = 0;
1905 dofaf = 0;
1906 pn = VPTOPP(vp);
1907
1908 if ((BIOREAD(bp) && !EXISTSOP(pmp, READ))
1909 || (BIOWRITE(bp) && !EXISTSOP(pmp, WRITE)))
1910 ERROUT(EOPNOTSUPP);
1911
1912 /*
1913 * Short-circuit optimization: don't flush buffer in between
1914 * VOP_INACTIVE and VOP_RECLAIM in case the node has no references.
1915 */
1916 if (pn->pn_stat & PNODE_DYING) {
1917 KASSERT(BIOWRITE(bp));
1918 bp->b_resid = 0;
1919 goto out;
1920 }
1921
1922 #ifdef DIAGNOSTIC
1923 if (bp->b_bcount > pmp->pmp_req_maxsize - PUFFS_REQSTRUCT_MAX)
1924 panic("puffs_strategy: wildly inappropriate buf bcount %d",
1925 bp->b_bcount);
1926 #endif
1927
1928 /*
1929 * See explanation for the necessity of a FAF in puffs_fsync.
1930 *
1931 * Also, do FAF in case we're suspending.
1932 * See puffs_vfsops.c:pageflush()
1933 */
1934 if (BIOWRITE(bp)) {
1935 simple_lock(&vp->v_interlock);
1936 if (vp->v_flag & VXLOCK)
1937 dofaf = 1;
1938 if (pn->pn_stat & PNODE_SUSPEND)
1939 dofaf = 1;
1940 simple_unlock(&vp->v_interlock);
1941 }
1942
1943 if (BIOASYNC(bp))
1944 dofaf = 1;
1945
1946 #ifdef DIAGNOSTIC
1947 if (curproc == uvm.pagedaemon_proc)
1948 KASSERT(dofaf);
1949 #endif
1950
1951 /* allocate transport structure */
1952 tomove = PUFFS_TOMOVE(bp->b_bcount, pmp);
1953 argsize = sizeof(struct puffs_vnreq_readwrite);
1954 rw_argp = malloc(argsize + tomove, M_PUFFS,
1955 M_ZERO | (dofaf ? M_NOWAIT : M_WAITOK));
1956 if (rw_argp == NULL)
1957 ERROUT(ENOMEM);
1958 RWARGS(rw_argp, 0, tomove, bp->b_blkno << DEV_BSHIFT, FSCRED);
1959
1960 /* 2x2 cases: read/write, faf/nofaf */
1961 if (BIOREAD(bp)) {
1962 if (dofaf) {
1963 puffs_vntouser_call(pmp, PUFFS_VN_READ, rw_argp,
1964 argsize, tomove, puffs_parkdone_asyncbioread,
1965 bp, vp, NULL);
1966 } else {
1967 error = puffs_vntouser(pmp, PUFFS_VN_READ,
1968 rw_argp, argsize, tomove, vp, NULL);
1969 if (error)
1970 goto out;
1971
1972 if (rw_argp->pvnr_resid > tomove)
1973 ERROUT(EINVAL);
1974
1975 moved = tomove - rw_argp->pvnr_resid;
1976
1977 (void)memcpy(bp->b_data, rw_argp->pvnr_data, moved);
1978 bp->b_resid = bp->b_bcount - moved;
1979 }
1980 } else {
1981 /*
1982 * make pages read-only before we write them if we want
1983 * write caching info
1984 */
1985 if (PUFFS_WCACHEINFO(pmp)) {
1986 struct uvm_object *uobj = &vp->v_uobj;
1987 int npages = (bp->b_bcount + PAGE_SIZE-1) >> PAGE_SHIFT;
1988 struct vm_page *vmp;
1989 int i;
1990
1991 for (i = 0; i < npages; i++) {
1992 vmp= uvm_pageratop((vaddr_t)bp->b_data
1993 + (i << PAGE_SHIFT));
1994 DPRINTF(("puffs_strategy: write-protecting "
1995 "vp %p page %p, offset %" PRId64"\n",
1996 vp, vmp, vmp->offset));
1997 simple_lock(&uobj->vmobjlock);
1998 vmp->flags |= PG_RDONLY;
1999 pmap_page_protect(vmp, VM_PROT_READ);
2000 simple_unlock(&uobj->vmobjlock);
2001 }
2002 }
2003
2004 (void)memcpy(&rw_argp->pvnr_data, bp->b_data, tomove);
2005 if (dofaf) {
2006 /*
2007 * assume FAF moves everything. frankly, we don't
2008 * really have a choice.
2009 */
2010 puffs_vntouser_faf(MPTOPUFFSMP(vp->v_mount),
2011 PUFFS_VN_WRITE, rw_argp, argsize + tomove, vp);
2012 bp->b_resid = bp->b_bcount - tomove;
2013 } else {
2014 error = puffs_vntouser(MPTOPUFFSMP(vp->v_mount),
2015 PUFFS_VN_WRITE, rw_argp, argsize + tomove,
2016 0, vp, NULL);
2017 if (error)
2018 goto out;
2019
2020 moved = tomove - rw_argp->pvnr_resid;
2021 if (rw_argp->pvnr_resid > tomove)
2022 ERROUT(EINVAL);
2023
2024 bp->b_resid = bp->b_bcount - moved;
2025 if (rw_argp->pvnr_resid != 0)
2026 ERROUT(EIO);
2027 }
2028 }
2029
2030 out:
2031 KASSERT(dofaf == 0 || error == 0);
2032 if (rw_argp && !dofaf)
2033 free(rw_argp, M_PUFFS);
2034
2035 if (error) {
2036 bp->b_error = error;
2037 bp->b_flags |= B_ERROR;
2038 }
2039
2040 if (error || !(BIOREAD(bp) && BIOASYNC(bp)))
2041 biodone(bp);
2042
2043 return error;
2044 }
2045
2046 int
2047 puffs_mmap(void *v)
2048 {
2049 struct vop_mmap_args /* {
2050 const struct vnodeop_desc *a_desc;
2051 struct vnode *a_vp;
2052 int a_fflags;
2053 kauth_cred_t a_cred;
2054 struct lwp *a_l;
2055 } */ *ap = v;
2056 struct puffs_mount *pmp;
2057 int error;
2058
2059 PUFFS_VNREQ(mmap);
2060
2061 pmp = MPTOPUFFSMP(ap->a_vp->v_mount);
2062
2063 if (!PUFFS_USE_PAGECACHE(pmp))
2064 return genfs_eopnotsupp(v);
2065
2066 if (EXISTSOP(pmp, MMAP)) {
2067 mmap_arg.pvnr_fflags = ap->a_fflags;
2068 puffs_credcvt(&mmap_arg.pvnr_cred, ap->a_cred);
2069 puffs_cidcvt(&mmap_arg.pvnr_cid, ap->a_l);
2070
2071 error = puffs_vntouser(pmp, PUFFS_VN_MMAP,
2072 &mmap_arg, sizeof(mmap_arg), 0,
2073 ap->a_vp, NULL);
2074 } else {
2075 error = genfs_mmap(v);
2076 }
2077
2078 return error;
2079 }
2080
2081
2082 /*
2083 * The rest don't get a free trip to userspace and back, they
2084 * have to stay within the kernel.
2085 */
2086
2087 /*
2088 * bmap doesn't really make any sense for puffs, so just 1:1 map it.
2089 * well, maybe somehow, somewhere, some day ....
2090 */
2091 int
2092 puffs_bmap(void *v)
2093 {
2094 struct vop_bmap_args /* {
2095 const struct vnodeop_desc *a_desc;
2096 struct vnode *a_vp;
2097 daddr_t a_bn;
2098 struct vnode **a_vpp;
2099 daddr_t *a_bnp;
2100 int *a_runp;
2101 } */ *ap = v;
2102 struct puffs_mount *pmp;
2103
2104 pmp = MPTOPUFFSMP(ap->a_vp->v_mount);
2105
2106 if (ap->a_vpp)
2107 *ap->a_vpp = ap->a_vp;
2108 if (ap->a_bnp)
2109 *ap->a_bnp = ap->a_bn;
2110 if (ap->a_runp)
2111 *ap->a_runp
2112 = (PUFFS_TOMOVE(pmp->pmp_req_maxsize, pmp)>>DEV_BSHIFT) - 1;
2113
2114 return 0;
2115 }
2116
2117 /*
2118 * Handle getpages faults in puffs. We let genfs_getpages() do most
2119 * of the dirty work, but we come in this route to do accounting tasks.
2120 * If the user server has specified functions for cache notifications
2121 * about reads and/or writes, we record which type of operation we got,
2122 * for which page range, and proceed to issue a FAF notification to the
2123 * server about it.
2124 */
2125 int
2126 puffs_getpages(void *v)
2127 {
2128 struct vop_getpages_args /* {
2129 const struct vnodeop_desc *a_desc;
2130 struct vnode *a_vp;
2131 voff_t a_offset;
2132 struct vm_page **a_m;
2133 int *a_count;
2134 int a_centeridx;
2135 vm_prot_t a_access_type;
2136 int a_advice;
2137 int a_flags;
2138 } */ *ap = v;
2139 struct puffs_mount *pmp;
2140 struct vnode *vp;
2141 struct vm_page **pgs;
2142 struct puffs_cacheinfo *pcinfo = NULL;
2143 struct puffs_cacherun *pcrun;
2144 void *parkmem = NULL;
2145 size_t runsizes;
2146 int i, npages, si, streakon;
2147 int error, locked, write;
2148
2149 pmp = MPTOPUFFSMP(ap->a_vp->v_mount);
2150 npages = *ap->a_count;
2151 pgs = ap->a_m;
2152 vp = ap->a_vp;
2153 locked = (ap->a_flags & PGO_LOCKED) != 0;
2154 write = (ap->a_access_type & VM_PROT_WRITE) != 0;
2155
2156 /* ccg xnaht - gets Wuninitialized wrong */
2157 pcrun = NULL;
2158 runsizes = 0;
2159
2160 if (write && PUFFS_WCACHEINFO(pmp)) {
2161 /* allocate worst-case memory */
2162 runsizes = ((npages / 2) + 1) * sizeof(struct puffs_cacherun);
2163 pcinfo = malloc(sizeof(struct puffs_cacheinfo) + runsizes,
2164 M_PUFFS, M_ZERO | locked ? M_NOWAIT : M_WAITOK);
2165
2166 /*
2167 * can't block if we're locked and can't mess up caching
2168 * information for fs server. so come back later, please
2169 */
2170 if (pcinfo == NULL)
2171 ERROUT(ENOMEM);
2172
2173 parkmem = puffs_park_alloc(locked == 0);
2174 if (parkmem == NULL)
2175 ERROUT(ENOMEM);
2176
2177 pcrun = pcinfo->pcache_runs;
2178 }
2179
2180 error = genfs_getpages(v);
2181 if (error)
2182 goto out;
2183
2184 if (PUFFS_WCACHEINFO(pmp) == 0)
2185 goto out;
2186
2187 /*
2188 * Let's see whose fault it was and inform the user server of
2189 * possibly read/written pages. Map pages from read faults
2190 * strictly read-only, since otherwise we might miss info on
2191 * when the page is actually write-faulted to.
2192 */
2193 if (!locked)
2194 simple_lock(&vp->v_uobj.vmobjlock);
2195 for (i = 0, si = 0, streakon = 0; i < npages; i++) {
2196 if (pgs[i] == NULL || pgs[i] == PGO_DONTCARE) {
2197 if (streakon && write) {
2198 streakon = 0;
2199 pcrun[si].pcache_runend
2200 = trunc_page(pgs[i]->offset) + PAGE_MASK;
2201 si++;
2202 }
2203 continue;
2204 }
2205 if (streakon == 0 && write) {
2206 streakon = 1;
2207 pcrun[si].pcache_runstart = pgs[i]->offset;
2208 }
2209
2210 if (!write)
2211 pgs[i]->flags |= PG_RDONLY;
2212 }
2213 /* was the last page part of our streak? */
2214 if (streakon) {
2215 pcrun[si].pcache_runend
2216 = trunc_page(pgs[i-1]->offset) + PAGE_MASK;
2217 si++;
2218 }
2219 if (!locked)
2220 simple_unlock(&vp->v_uobj.vmobjlock);
2221
2222 KASSERT(si <= (npages / 2) + 1);
2223
2224 /* send results to userspace */
2225 if (write)
2226 puffs_cacheop(pmp, parkmem, pcinfo,
2227 sizeof(struct puffs_cacheinfo) + runsizes, VPTOPNC(vp));
2228
2229 out:
2230 if (error) {
2231 if (pcinfo != NULL)
2232 free(pcinfo, M_PUFFS);
2233 if (parkmem != NULL)
2234 puffs_park_release(parkmem, 1);
2235 }
2236
2237 return error;
2238 }
2239
2240 int
2241 puffs_lock(void *v)
2242 {
2243 struct vop_lock_args /* {
2244 struct vnode *a_vp;
2245 int a_flags;
2246 }*/ *ap = v;
2247 struct vnode *vp = ap->a_vp;
2248 struct mount *mp = vp->v_mount;
2249
2250 #if 0
2251 DPRINTF(("puffs_lock: lock %p, args 0x%x\n", vp, ap->a_flags));
2252 #endif
2253
2254 /*
2255 * XXX: this avoids deadlocking when we're suspending.
2256 * e.g. some ops holding the vnode lock might be blocked for
2257 * the vfs transaction lock so we'd deadlock.
2258 *
2259 * Now once again this is skating on the thin ice of modern life,
2260 * since we are breaking the consistency guarantee provided
2261 * _to the user server_ by vnode locking. Hopefully this will
2262 * get fixed soon enough by getting rid of the dependency on
2263 * vnode locks alltogether.
2264 */
2265 if (fstrans_is_owner(mp) && fstrans_getstate(mp) == FSTRANS_SUSPENDING){
2266 if (ap->a_flags & LK_INTERLOCK)
2267 simple_unlock(&vp->v_interlock);
2268 return 0;
2269 }
2270
2271 return lockmgr(&vp->v_lock, ap->a_flags, &vp->v_interlock);
2272 }
2273
2274 int
2275 puffs_unlock(void *v)
2276 {
2277 struct vop_unlock_args /* {
2278 struct vnode *a_vp;
2279 int a_flags;
2280 } */ *ap = v;
2281 struct vnode *vp = ap->a_vp;
2282 struct mount *mp = vp->v_mount;
2283
2284 #if 0
2285 DPRINTF(("puffs_unlock: lock %p, args 0x%x\n", vp, ap->a_flags));
2286 #endif
2287
2288 /* XXX: see puffs_lock() */
2289 if (fstrans_is_owner(mp) && fstrans_getstate(mp) == FSTRANS_SUSPENDING){
2290 if (ap->a_flags & LK_INTERLOCK)
2291 simple_unlock(&vp->v_interlock);
2292 return 0;
2293 }
2294
2295 return lockmgr(&vp->v_lock, ap->a_flags | LK_RELEASE, &vp->v_interlock);
2296 }
2297
2298 int
2299 puffs_islocked(void *v)
2300 {
2301 struct vop_islocked_args *ap = v;
2302 int rv;
2303
2304 rv = lockstatus(&ap->a_vp->v_lock);
2305 return rv;
2306 }
2307
2308 int
2309 puffs_generic(void *v)
2310 {
2311 struct vop_generic_args *ap = v;
2312
2313 (void)ap;
2314 DPRINTF(("puffs_generic: ap->a_desc = %s\n", ap->a_desc->vdesc_name));
2315
2316 return EOPNOTSUPP;
2317 }
2318
2319
2320 /*
2321 * spec & fifo. These call the miscfs spec and fifo vectors, but issue
2322 * FAF update information for the puffs node first.
2323 */
2324 int
2325 puffs_spec_read(void *v)
2326 {
2327 struct vop_read_args /* {
2328 const struct vnodeop_desc *a_desc;
2329 struct vnode *a_vp;
2330 struct uio *a_uio;
2331 int a_ioflag;
2332 kauth_cred_t a_cred;
2333 } */ *ap = v;
2334
2335 puffs_updatenode(ap->a_vp, PUFFS_UPDATEATIME);
2336 return VOCALL(spec_vnodeop_p, VOFFSET(vop_read), v);
2337 }
2338
2339 int
2340 puffs_spec_write(void *v)
2341 {
2342 struct vop_write_args /* {
2343 const struct vnodeop_desc *a_desc;
2344 struct vnode *a_vp;
2345 struct uio *a_uio;
2346 int a_ioflag;
2347 kauth_cred_t a_cred;
2348 }*/ *ap = v;
2349
2350 puffs_updatenode(ap->a_vp, PUFFS_UPDATEMTIME);
2351 return VOCALL(spec_vnodeop_p, VOFFSET(vop_write), v);
2352 }
2353
2354 int
2355 puffs_fifo_read(void *v)
2356 {
2357 struct vop_read_args /* {
2358 const struct vnodeop_desc *a_desc;
2359 struct vnode *a_vp;
2360 struct uio *a_uio;
2361 int a_ioflag;
2362 kauth_cred_t a_cred;
2363 } */ *ap = v;
2364
2365 puffs_updatenode(ap->a_vp, PUFFS_UPDATEATIME);
2366 return VOCALL(fifo_vnodeop_p, VOFFSET(vop_read), v);
2367 }
2368
2369 int
2370 puffs_fifo_write(void *v)
2371 {
2372 struct vop_write_args /* {
2373 const struct vnodeop_desc *a_desc;
2374 struct vnode *a_vp;
2375 struct uio *a_uio;
2376 int a_ioflag;
2377 kauth_cred_t a_cred;
2378 }*/ *ap = v;
2379
2380 puffs_updatenode(ap->a_vp, PUFFS_UPDATEMTIME);
2381 return VOCALL(fifo_vnodeop_p, VOFFSET(vop_write), v);
2382 }
2383