puffs_vnops.c revision 1.73 1 /* $NetBSD: puffs_vnops.c,v 1.73 2007/06/01 15:59:37 yamt Exp $ */
2
3 /*
4 * Copyright (c) 2005, 2006, 2007 Antti Kantee. All Rights Reserved.
5 *
6 * Development of this software was supported by the
7 * Google Summer of Code program and the Ulla Tuominen Foundation.
8 * The Google SoC project was mentored by Bill Studenmund.
9 *
10 * Redistribution and use in source and binary forms, with or without
11 * modification, are permitted provided that the following conditions
12 * are met:
13 * 1. Redistributions of source code must retain the above copyright
14 * notice, this list of conditions and the following disclaimer.
15 * 2. Redistributions in binary form must reproduce the above copyright
16 * notice, this list of conditions and the following disclaimer in the
17 * documentation and/or other materials provided with the distribution.
18 * 3. The name of the company nor the name of the author may be used to
19 * endorse or promote products derived from this software without specific
20 * prior written permission.
21 *
22 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS
23 * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
24 * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
25 * DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
26 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
27 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
28 * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
29 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
30 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
31 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
32 * SUCH DAMAGE.
33 */
34
35 #include <sys/cdefs.h>
36 __KERNEL_RCSID(0, "$NetBSD: puffs_vnops.c,v 1.73 2007/06/01 15:59:37 yamt Exp $");
37
38 #include <sys/param.h>
39 #include <sys/fstrans.h>
40 #include <sys/malloc.h>
41 #include <sys/mount.h>
42 #include <sys/namei.h>
43 #include <sys/vnode.h>
44 #include <uvm/uvm.h>
45
46 #include <fs/puffs/puffs_msgif.h>
47 #include <fs/puffs/puffs_sys.h>
48
49 #include <miscfs/fifofs/fifo.h>
50 #include <miscfs/genfs/genfs.h>
51 #include <miscfs/specfs/specdev.h>
52
53 int puffs_lookup(void *);
54 int puffs_create(void *);
55 int puffs_access(void *);
56 int puffs_mknod(void *);
57 int puffs_open(void *);
58 int puffs_close(void *);
59 int puffs_getattr(void *);
60 int puffs_setattr(void *);
61 int puffs_reclaim(void *);
62 int puffs_readdir(void *);
63 int puffs_poll(void *);
64 int puffs_fsync(void *);
65 int puffs_seek(void *);
66 int puffs_remove(void *);
67 int puffs_mkdir(void *);
68 int puffs_rmdir(void *);
69 int puffs_link(void *);
70 int puffs_readlink(void *);
71 int puffs_symlink(void *);
72 int puffs_rename(void *);
73 int puffs_read(void *);
74 int puffs_write(void *);
75 int puffs_fcntl(void *);
76 int puffs_ioctl(void *);
77 int puffs_inactive(void *);
78 int puffs_print(void *);
79 int puffs_pathconf(void *);
80 int puffs_advlock(void *);
81 int puffs_strategy(void *);
82 int puffs_bmap(void *);
83 int puffs_mmap(void *);
84 int puffs_getpages(void *);
85
86 int puffs_spec_read(void *);
87 int puffs_spec_write(void *);
88 int puffs_fifo_read(void *);
89 int puffs_fifo_write(void *);
90
91 int puffs_checkop(void *);
92
93
94 /* VOP_LEASE() not included */
95
96 int puffs_generic(void *);
97
98 #if 0
99 #define puffs_lock genfs_lock
100 #define puffs_unlock genfs_unlock
101 #define puffs_islocked genfs_islocked
102 #else
103 int puffs_lock(void *);
104 int puffs_unlock(void *);
105 int puffs_islocked(void *);
106 #endif
107
108 int (**puffs_vnodeop_p)(void *);
109 const struct vnodeopv_entry_desc puffs_vnodeop_entries[] = {
110 { &vop_default_desc, vn_default_error },
111 { &vop_lookup_desc, puffs_lookup }, /* REAL lookup */
112 { &vop_create_desc, puffs_checkop }, /* create */
113 { &vop_mknod_desc, puffs_checkop }, /* mknod */
114 { &vop_open_desc, puffs_open }, /* REAL open */
115 { &vop_close_desc, puffs_checkop }, /* close */
116 { &vop_access_desc, puffs_access }, /* REAL access */
117 { &vop_getattr_desc, puffs_checkop }, /* getattr */
118 { &vop_setattr_desc, puffs_checkop }, /* setattr */
119 { &vop_read_desc, puffs_checkop }, /* read */
120 { &vop_write_desc, puffs_checkop }, /* write */
121 { &vop_fcntl_desc, puffs_checkop }, /* fcntl */
122 { &vop_ioctl_desc, puffs_checkop }, /* ioctl */
123 { &vop_fsync_desc, puffs_fsync }, /* REAL fsync */
124 { &vop_seek_desc, puffs_checkop }, /* seek */
125 { &vop_remove_desc, puffs_checkop }, /* remove */
126 { &vop_link_desc, puffs_checkop }, /* link */
127 { &vop_rename_desc, puffs_checkop }, /* rename */
128 { &vop_mkdir_desc, puffs_checkop }, /* mkdir */
129 { &vop_rmdir_desc, puffs_checkop }, /* rmdir */
130 { &vop_symlink_desc, puffs_checkop }, /* symlink */
131 { &vop_readdir_desc, puffs_checkop }, /* readdir */
132 { &vop_readlink_desc, puffs_checkop }, /* readlink */
133 { &vop_getpages_desc, puffs_checkop }, /* getpages */
134 { &vop_putpages_desc, genfs_putpages }, /* REAL putpages */
135 { &vop_pathconf_desc, puffs_checkop }, /* pathconf */
136 { &vop_advlock_desc, puffs_checkop }, /* advlock */
137 { &vop_strategy_desc, puffs_strategy }, /* REAL strategy */
138 { &vop_revoke_desc, genfs_revoke }, /* REAL revoke */
139 { &vop_abortop_desc, genfs_abortop }, /* REAL abortop */
140 { &vop_inactive_desc, puffs_inactive }, /* REAL inactive */
141 { &vop_reclaim_desc, puffs_reclaim }, /* REAL reclaim */
142 { &vop_lock_desc, puffs_lock }, /* REAL lock */
143 { &vop_unlock_desc, puffs_unlock }, /* REAL unlock */
144 { &vop_bmap_desc, puffs_bmap }, /* REAL bmap */
145 { &vop_print_desc, puffs_print }, /* REAL print */
146 { &vop_islocked_desc, puffs_islocked }, /* REAL islocked */
147 { &vop_bwrite_desc, genfs_nullop }, /* REAL bwrite */
148 { &vop_mmap_desc, puffs_mmap }, /* REAL mmap */
149 { &vop_poll_desc, puffs_poll }, /* REAL poll */
150
151 { &vop_kqfilter_desc, genfs_eopnotsupp }, /* kqfilter XXX */
152 { NULL, NULL }
153 };
154 const struct vnodeopv_desc puffs_vnodeop_opv_desc =
155 { &puffs_vnodeop_p, puffs_vnodeop_entries };
156
157
158 int (**puffs_specop_p)(void *);
159 const struct vnodeopv_entry_desc puffs_specop_entries[] = {
160 { &vop_default_desc, vn_default_error },
161 { &vop_lookup_desc, spec_lookup }, /* lookup, ENOTDIR */
162 { &vop_create_desc, spec_create }, /* genfs_badop */
163 { &vop_mknod_desc, spec_mknod }, /* genfs_badop */
164 { &vop_open_desc, spec_open }, /* spec_open */
165 { &vop_close_desc, spec_close }, /* spec_close */
166 { &vop_access_desc, puffs_checkop }, /* access */
167 { &vop_getattr_desc, puffs_checkop }, /* getattr */
168 { &vop_setattr_desc, puffs_checkop }, /* setattr */
169 { &vop_read_desc, puffs_spec_read }, /* update, read */
170 { &vop_write_desc, puffs_spec_write }, /* update, write */
171 { &vop_lease_desc, spec_lease_check }, /* genfs_nullop */
172 { &vop_ioctl_desc, spec_ioctl }, /* spec_ioctl */
173 { &vop_fcntl_desc, genfs_fcntl }, /* dummy */
174 { &vop_poll_desc, spec_poll }, /* spec_poll */
175 { &vop_kqfilter_desc, spec_kqfilter }, /* spec_kqfilter */
176 { &vop_revoke_desc, spec_revoke }, /* genfs_revoke */
177 { &vop_mmap_desc, spec_mmap }, /* spec_mmap */
178 { &vop_fsync_desc, spec_fsync }, /* vflushbuf */
179 { &vop_seek_desc, spec_seek }, /* genfs_nullop */
180 { &vop_remove_desc, spec_remove }, /* genfs_badop */
181 { &vop_link_desc, spec_link }, /* genfs_badop */
182 { &vop_rename_desc, spec_rename }, /* genfs_badop */
183 { &vop_mkdir_desc, spec_mkdir }, /* genfs_badop */
184 { &vop_rmdir_desc, spec_rmdir }, /* genfs_badop */
185 { &vop_symlink_desc, spec_symlink }, /* genfs_badop */
186 { &vop_readdir_desc, spec_readdir }, /* genfs_badop */
187 { &vop_readlink_desc, spec_readlink }, /* genfs_badop */
188 { &vop_abortop_desc, spec_abortop }, /* genfs_badop */
189 { &vop_inactive_desc, puffs_inactive }, /* REAL inactive */
190 { &vop_reclaim_desc, puffs_reclaim }, /* REAL reclaim */
191 { &vop_lock_desc, puffs_lock }, /* REAL lock */
192 { &vop_unlock_desc, puffs_unlock }, /* REAL unlock */
193 { &vop_bmap_desc, spec_bmap }, /* dummy */
194 { &vop_strategy_desc, spec_strategy }, /* dev strategy */
195 { &vop_print_desc, puffs_print }, /* REAL print */
196 { &vop_islocked_desc, puffs_islocked }, /* REAL islocked */
197 { &vop_pathconf_desc, spec_pathconf }, /* pathconf */
198 { &vop_advlock_desc, spec_advlock }, /* lf_advlock */
199 { &vop_bwrite_desc, vn_bwrite }, /* bwrite */
200 { &vop_getpages_desc, spec_getpages }, /* genfs_getpages */
201 { &vop_putpages_desc, spec_putpages }, /* genfs_putpages */
202 #if 0
203 { &vop_openextattr_desc, _openextattr }, /* openextattr */
204 { &vop_closeextattr_desc, _closeextattr }, /* closeextattr */
205 { &vop_getextattr_desc, _getextattr }, /* getextattr */
206 { &vop_setextattr_desc, _setextattr }, /* setextattr */
207 { &vop_listextattr_desc, _listextattr }, /* listextattr */
208 { &vop_deleteextattr_desc, _deleteextattr }, /* deleteextattr */
209 #endif
210 { NULL, NULL }
211 };
212 const struct vnodeopv_desc puffs_specop_opv_desc =
213 { &puffs_specop_p, puffs_specop_entries };
214
215
216 int (**puffs_fifoop_p)(void *);
217 const struct vnodeopv_entry_desc puffs_fifoop_entries[] = {
218 { &vop_default_desc, vn_default_error },
219 { &vop_lookup_desc, fifo_lookup }, /* lookup, ENOTDIR */
220 { &vop_create_desc, fifo_create }, /* genfs_badop */
221 { &vop_mknod_desc, fifo_mknod }, /* genfs_badop */
222 { &vop_open_desc, fifo_open }, /* open */
223 { &vop_close_desc, fifo_close }, /* close */
224 { &vop_access_desc, puffs_checkop }, /* access */
225 { &vop_getattr_desc, puffs_checkop }, /* getattr */
226 { &vop_setattr_desc, puffs_checkop }, /* setattr */
227 { &vop_read_desc, puffs_fifo_read }, /* read, update */
228 { &vop_write_desc, puffs_fifo_write }, /* write, update */
229 { &vop_lease_desc, fifo_lease_check }, /* genfs_nullop */
230 { &vop_ioctl_desc, fifo_ioctl }, /* ioctl */
231 { &vop_fcntl_desc, genfs_fcntl }, /* dummy */
232 { &vop_poll_desc, fifo_poll }, /* poll */
233 { &vop_kqfilter_desc, fifo_kqfilter }, /* kqfilter */
234 { &vop_revoke_desc, fifo_revoke }, /* genfs_revoke */
235 { &vop_mmap_desc, fifo_mmap }, /* genfs_badop */
236 { &vop_fsync_desc, fifo_fsync }, /* genfs_nullop*/
237 { &vop_seek_desc, fifo_seek }, /* genfs_badop */
238 { &vop_remove_desc, fifo_remove }, /* genfs_badop */
239 { &vop_link_desc, fifo_link }, /* genfs_badop */
240 { &vop_rename_desc, fifo_rename }, /* genfs_badop */
241 { &vop_mkdir_desc, fifo_mkdir }, /* genfs_badop */
242 { &vop_rmdir_desc, fifo_rmdir }, /* genfs_badop */
243 { &vop_symlink_desc, fifo_symlink }, /* genfs_badop */
244 { &vop_readdir_desc, fifo_readdir }, /* genfs_badop */
245 { &vop_readlink_desc, fifo_readlink }, /* genfs_badop */
246 { &vop_abortop_desc, fifo_abortop }, /* genfs_badop */
247 { &vop_inactive_desc, puffs_inactive }, /* REAL inactive */
248 { &vop_reclaim_desc, puffs_reclaim }, /* REAL reclaim */
249 { &vop_lock_desc, puffs_lock }, /* REAL lock */
250 { &vop_unlock_desc, puffs_unlock }, /* REAL unlock */
251 { &vop_bmap_desc, fifo_bmap }, /* dummy */
252 { &vop_strategy_desc, fifo_strategy }, /* genfs_badop */
253 { &vop_print_desc, puffs_print }, /* REAL print */
254 { &vop_islocked_desc, puffs_islocked }, /* REAL islocked */
255 { &vop_pathconf_desc, fifo_pathconf }, /* pathconf */
256 { &vop_advlock_desc, fifo_advlock }, /* genfs_einval */
257 { &vop_bwrite_desc, vn_bwrite }, /* bwrite */
258 { &vop_putpages_desc, fifo_putpages }, /* genfs_null_putpages*/
259 #if 0
260 { &vop_openextattr_desc, _openextattr }, /* openextattr */
261 { &vop_closeextattr_desc, _closeextattr }, /* closeextattr */
262 { &vop_getextattr_desc, _getextattr }, /* getextattr */
263 { &vop_setextattr_desc, _setextattr }, /* setextattr */
264 { &vop_listextattr_desc, _listextattr }, /* listextattr */
265 { &vop_deleteextattr_desc, _deleteextattr }, /* deleteextattr */
266 #endif
267 { NULL, NULL }
268 };
269 const struct vnodeopv_desc puffs_fifoop_opv_desc =
270 { &puffs_fifoop_p, puffs_fifoop_entries };
271
272
273 /* "real" vnode operations */
274 int (**puffs_msgop_p)(void *);
275 const struct vnodeopv_entry_desc puffs_msgop_entries[] = {
276 { &vop_default_desc, vn_default_error },
277 { &vop_create_desc, puffs_create }, /* create */
278 { &vop_mknod_desc, puffs_mknod }, /* mknod */
279 { &vop_open_desc, puffs_open }, /* open */
280 { &vop_close_desc, puffs_close }, /* close */
281 { &vop_access_desc, puffs_access }, /* access */
282 { &vop_getattr_desc, puffs_getattr }, /* getattr */
283 { &vop_setattr_desc, puffs_setattr }, /* setattr */
284 { &vop_read_desc, puffs_read }, /* read */
285 { &vop_write_desc, puffs_write }, /* write */
286 { &vop_fcntl_desc, puffs_fcntl }, /* fcntl */
287 { &vop_ioctl_desc, puffs_ioctl }, /* ioctl */
288 { &vop_seek_desc, puffs_seek }, /* seek */
289 { &vop_remove_desc, puffs_remove }, /* remove */
290 { &vop_link_desc, puffs_link }, /* link */
291 { &vop_rename_desc, puffs_rename }, /* rename */
292 { &vop_mkdir_desc, puffs_mkdir }, /* mkdir */
293 { &vop_rmdir_desc, puffs_rmdir }, /* rmdir */
294 { &vop_symlink_desc, puffs_symlink }, /* symlink */
295 { &vop_readdir_desc, puffs_readdir }, /* readdir */
296 { &vop_readlink_desc, puffs_readlink }, /* readlink */
297 { &vop_print_desc, puffs_print }, /* print */
298 { &vop_islocked_desc, puffs_islocked }, /* islocked */
299 { &vop_pathconf_desc, puffs_pathconf }, /* pathconf */
300 { &vop_advlock_desc, puffs_advlock }, /* advlock */
301 { &vop_getpages_desc, puffs_getpages }, /* getpages */
302 { NULL, NULL }
303 };
304 const struct vnodeopv_desc puffs_msgop_opv_desc =
305 { &puffs_msgop_p, puffs_msgop_entries };
306
307
/*
 * Evaluates to the vnode itself when VOP_ISLOCKED() reports it locked,
 * NULL otherwise.  Note: the argument is evaluated twice.
 */
#define LOCKEDVP(a) (VOP_ISLOCKED(a) != 0 ? (a) : NULL)
309
310
/*
 * This is a generic vnode operation handler.  It checks if the necessary
 * operations for the called vnode operation are implemented by userspace
 * and either returns a dummy return value or proceeds to call the real
 * vnode operation from puffs_msgop_p.
 *
 * XXX: this should be described elsewhere and autogenerated; the
 * complexity of the vnode operations vectors and their interrelationships
 * is also getting a bit out of hand.  Another problem is that we need this
 * same information in the fs server code, so keeping the two in sync
 * manually is not a viable (long term) plan.
 */
323
324 /* not supported, handle locking protocol */
325 #define CHECKOP_NOTSUPP(op) \
326 case VOP_##op##_DESCOFFSET: \
327 if (pmp->pmp_vnopmask[PUFFS_VN_##op] == 0) \
328 return genfs_eopnotsupp(v); \
329 break
330
331 /* always succeed, no locking */
332 #define CHECKOP_SUCCESS(op) \
333 case VOP_##op##_DESCOFFSET: \
334 if (pmp->pmp_vnopmask[PUFFS_VN_##op] == 0) \
335 return 0; \
336 break
337
338 int
339 puffs_checkop(void *v)
340 {
341 struct vop_generic_args /* {
342 struct vnodeop_desc *a_desc;
343 spooky mystery contents;
344 } */ *ap = v;
345 struct vnodeop_desc *desc = ap->a_desc;
346 struct puffs_mount *pmp;
347 struct vnode *vp;
348 int offset;
349
350 DPRINTF_VERBOSE(("checkop call %s (%d)\n",
351 ap->a_desc->vdesc_name, ap->a_desc->vdesc_offset));
352
353 offset = ap->a_desc->vdesc_vp_offsets[0];
354 #ifdef DIAGNOSTIC
355 if (offset == VDESC_NO_OFFSET)
356 panic("puffs_checkop: no vnode, why did you call me?");
357 #endif
358 vp = *VOPARG_OFFSETTO(struct vnode **, offset, ap);
359 pmp = MPTOPUFFSMP(vp->v_mount);
360
361 if (!ALLOPS(pmp)) {
362 switch (desc->vdesc_offset) {
363 CHECKOP_NOTSUPP(CREATE);
364 CHECKOP_NOTSUPP(MKNOD);
365 CHECKOP_NOTSUPP(GETATTR);
366 CHECKOP_NOTSUPP(SETATTR);
367 CHECKOP_NOTSUPP(READ);
368 CHECKOP_NOTSUPP(WRITE);
369 CHECKOP_NOTSUPP(FCNTL);
370 CHECKOP_NOTSUPP(IOCTL);
371 CHECKOP_NOTSUPP(REMOVE);
372 CHECKOP_NOTSUPP(LINK);
373 CHECKOP_NOTSUPP(RENAME);
374 CHECKOP_NOTSUPP(MKDIR);
375 CHECKOP_NOTSUPP(RMDIR);
376 CHECKOP_NOTSUPP(SYMLINK);
377 CHECKOP_NOTSUPP(READDIR);
378 CHECKOP_NOTSUPP(READLINK);
379 CHECKOP_NOTSUPP(PRINT);
380 CHECKOP_NOTSUPP(PATHCONF);
381 CHECKOP_NOTSUPP(ADVLOCK);
382
383 CHECKOP_SUCCESS(ACCESS);
384 CHECKOP_SUCCESS(CLOSE);
385 CHECKOP_SUCCESS(SEEK);
386
387 case VOP_GETPAGES_DESCOFFSET:
388 if (!EXISTSOP(pmp, READ))
389 return genfs_eopnotsupp(v);
390 break;
391
392 default:
393 panic("puffs_checkop: unhandled vnop %d",
394 desc->vdesc_offset);
395 }
396 }
397
398 return VOCALL(puffs_msgop_p, ap->a_desc->vdesc_offset, v);
399 }
400
401
402 int
403 puffs_lookup(void *v)
404 {
405 struct vop_lookup_args /* {
406 const struct vnodeop_desc *a_desc;
407 struct vnode *a_dvp;
408 struct vnode **a_vpp;
409 struct componentname *a_cnp;
410 } */ *ap = v;
411 struct puffs_mount *pmp;
412 struct componentname *cnp;
413 struct vnode *vp, *dvp;
414 struct puffs_node *dpn;
415 int isdot;
416 int error;
417
418 PUFFS_VNREQ(lookup);
419
420 pmp = MPTOPUFFSMP(ap->a_dvp->v_mount);
421 cnp = ap->a_cnp;
422 dvp = ap->a_dvp;
423 *ap->a_vpp = NULL;
424
425 /* first things first: check access */
426 error = VOP_ACCESS(dvp, VEXEC, cnp->cn_cred, cnp->cn_lwp);
427 if (error)
428 return error;
429
430 isdot = cnp->cn_namelen == 1 && *cnp->cn_nameptr == '.';
431
432 DPRINTF(("puffs_lookup: \"%s\", parent vnode %p, op: %lx\n",
433 cnp->cn_nameptr, dvp, cnp->cn_nameiop));
434
435 /*
436 * Check if someone fed it into the cache
437 */
438 if (PUFFS_DOCACHE(pmp)) {
439 error = cache_lookup(dvp, ap->a_vpp, cnp);
440
441 if (error >= 0)
442 return error;
443 }
444
445 if (isdot) {
446 vp = ap->a_dvp;
447 vref(vp);
448 *ap->a_vpp = vp;
449 return 0;
450 }
451
452 puffs_makecn(&lookup_arg.pvnr_cn, cnp);
453
454 if (cnp->cn_flags & ISDOTDOT)
455 VOP_UNLOCK(dvp, 0);
456
457 error = puffs_vntouser(pmp, PUFFS_VN_LOOKUP,
458 &lookup_arg, sizeof(lookup_arg), 0, dvp, NULL);
459 DPRINTF(("puffs_lookup: return of the userspace, part %d\n", error));
460
461 /*
462 * In case of error, there is no new vnode to play with, so be
463 * happy with the NULL value given to vpp in the beginning.
464 * Also, check if this really was an error or the target was not
465 * present. Either treat it as a non-error for CREATE/RENAME or
466 * enter the component into the negative name cache (if desired).
467 */
468 if (error) {
469 if (error == ENOENT) {
470 if ((cnp->cn_flags & ISLASTCN)
471 && (cnp->cn_nameiop == CREATE
472 || cnp->cn_nameiop == RENAME)) {
473 cnp->cn_flags |= SAVENAME;
474 error = EJUSTRETURN;
475 } else {
476 if ((cnp->cn_flags & MAKEENTRY)
477 && PUFFS_DOCACHE(pmp))
478 cache_enter(dvp, NULL, cnp);
479 }
480 } else if (error < 0) {
481 error = EINVAL;
482 }
483 goto errout;
484 }
485
486 /*
487 * Check that we don't get our parent node back, that would cause
488 * a pretty obvious deadlock.
489 */
490 dpn = dvp->v_data;
491 if (lookup_arg.pvnr_newnode == dpn->pn_cookie) {
492 error = EINVAL;
493 goto errout;
494 }
495
496 /* XXX: race here */
497 /* XXX2: this check for node existence twice */
498 vp = puffs_pnode2vnode(pmp, lookup_arg.pvnr_newnode, 1);
499 if (!vp) {
500 error = puffs_getvnode(dvp->v_mount,
501 lookup_arg.pvnr_newnode, lookup_arg.pvnr_vtype,
502 lookup_arg.pvnr_size, lookup_arg.pvnr_rdev, &vp);
503 if (error) {
504 goto errout;
505 }
506 vn_lock(vp, LK_EXCLUSIVE | LK_RETRY);
507 }
508 *ap->a_vpp = vp;
509
510 if ((cnp->cn_flags & MAKEENTRY) != 0 && PUFFS_DOCACHE(pmp))
511 cache_enter(dvp, vp, cnp);
512
513 errout:
514 if (cnp->cn_flags & ISDOTDOT)
515 vn_lock(dvp, LK_EXCLUSIVE | LK_RETRY);
516
517 DPRINTF(("puffs_lookup: returning %d %p\n", error, *ap->a_vpp));
518 return error;
519 }
520
521 int
522 puffs_create(void *v)
523 {
524 struct vop_create_args /* {
525 const struct vnodeop_desc *a_desc;
526 struct vnode *a_dvp;
527 struct vnode **a_vpp;
528 struct componentname *a_cnp;
529 struct vattr *a_vap;
530 } */ *ap = v;
531 int error;
532
533 PUFFS_VNREQ(create);
534 DPRINTF(("puffs_create: dvp %p, cnp: %s\n",
535 ap->a_dvp, ap->a_cnp->cn_nameptr));
536
537 puffs_makecn(&create_arg.pvnr_cn, ap->a_cnp);
538 create_arg.pvnr_va = *ap->a_vap;
539
540 error = puffs_vntouser(MPTOPUFFSMP(ap->a_dvp->v_mount), PUFFS_VN_CREATE,
541 &create_arg, sizeof(create_arg), 0, ap->a_dvp, NULL);
542 if (error)
543 goto out;
544
545 error = puffs_newnode(ap->a_dvp->v_mount, ap->a_dvp, ap->a_vpp,
546 create_arg.pvnr_newnode, ap->a_cnp, ap->a_vap->va_type, 0);
547 /* XXX: in case of error, need to uncommit userspace transaction */
548
549 out:
550 if (error || (ap->a_cnp->cn_flags & SAVESTART) == 0)
551 PNBUF_PUT(ap->a_cnp->cn_pnbuf);
552 vput(ap->a_dvp);
553
554 DPRINTF(("puffs_create: return %d\n", error));
555 return error;
556 }
557
558 int
559 puffs_mknod(void *v)
560 {
561 struct vop_mknod_args /* {
562 const struct vnodeop_desc *a_desc;
563 struct vnode *a_dvp;
564 struct vnode **a_vpp;
565 struct componentname *a_cnp;
566 struct vattr *a_vap;
567 } */ *ap = v;
568 int error;
569
570 PUFFS_VNREQ(mknod);
571
572 puffs_makecn(&mknod_arg.pvnr_cn, ap->a_cnp);
573 mknod_arg.pvnr_va = *ap->a_vap;
574
575 error = puffs_vntouser(MPTOPUFFSMP(ap->a_dvp->v_mount), PUFFS_VN_MKNOD,
576 &mknod_arg, sizeof(mknod_arg), 0, ap->a_dvp, NULL);
577 if (error)
578 goto out;
579
580 error = puffs_newnode(ap->a_dvp->v_mount, ap->a_dvp, ap->a_vpp,
581 mknod_arg.pvnr_newnode, ap->a_cnp, ap->a_vap->va_type,
582 ap->a_vap->va_rdev);
583
584 out:
585 if (error || (ap->a_cnp->cn_flags & SAVESTART) == 0)
586 PNBUF_PUT(ap->a_cnp->cn_pnbuf);
587 vput(ap->a_dvp);
588 return error;
589 }
590
591 int
592 puffs_open(void *v)
593 {
594 struct vop_open_args /* {
595 const struct vnodeop_desc *a_desc;
596 struct vnode *a_vp;
597 int a_mode;
598 kauth_cred_t a_cred;
599 struct lwp *a_l;
600 } */ *ap = v;
601 struct vnode *vp = ap->a_vp;
602 struct puffs_mount *pmp = MPTOPUFFSMP(vp->v_mount);
603 int mode = ap->a_mode;
604 int rv;
605
606 PUFFS_VNREQ(open);
607 DPRINTF(("puffs_open: vp %p, mode 0x%x\n", vp, mode));
608
609 if (vp->v_type == VREG && mode & FWRITE && !EXISTSOP(pmp, WRITE)) {
610 rv = EROFS;
611 goto out;
612 }
613
614 if (!EXISTSOP(pmp, OPEN)) {
615 rv = 0;
616 goto out;
617 }
618
619 open_arg.pvnr_mode = mode;
620 puffs_credcvt(&open_arg.pvnr_cred, ap->a_cred);
621 open_arg.pvnr_pid = puffs_lwp2pid(ap->a_l);
622
623 rv = puffs_vntouser(MPTOPUFFSMP(vp->v_mount), PUFFS_VN_OPEN,
624 &open_arg, sizeof(open_arg), 0, vp, NULL);
625
626 out:
627 DPRINTF(("puffs_open: returning %d\n", rv));
628 return rv;
629 }
630
631 int
632 puffs_close(void *v)
633 {
634 struct vop_close_args /* {
635 const struct vnodeop_desc *a_desc;
636 struct vnode *a_vp;
637 int a_fflag;
638 kauth_cred_t a_cred;
639 struct lwp *a_l;
640 } */ *ap = v;
641 struct puffs_vnreq_close *close_argp;
642
643 close_argp = malloc(sizeof(struct puffs_vnreq_close),
644 M_PUFFS, M_WAITOK | M_ZERO);
645 close_argp->pvnr_fflag = ap->a_fflag;
646 puffs_credcvt(&close_argp->pvnr_cred, ap->a_cred);
647 close_argp->pvnr_pid = puffs_lwp2pid(ap->a_l);
648
649 puffs_vntouser_faf(MPTOPUFFSMP(ap->a_vp->v_mount), PUFFS_VN_CLOSE,
650 close_argp, sizeof(struct puffs_vnreq_close), ap->a_vp);
651
652 return 0;
653 }
654
655 int
656 puffs_access(void *v)
657 {
658 struct vop_access_args /* {
659 const struct vnodeop_desc *a_desc;
660 struct vnode *a_vp;
661 int a_mode;
662 kauth_cred_t a_cred;
663 struct lwp *a_l;
664 } */ *ap = v;
665 struct vnode *vp = ap->a_vp;
666 struct puffs_mount *pmp = MPTOPUFFSMP(vp->v_mount);
667 int mode = ap->a_mode;
668
669 PUFFS_VNREQ(access);
670
671 if (vp->v_type == VREG && mode & VWRITE && !EXISTSOP(pmp, WRITE))
672 return EROFS;
673
674 if (!EXISTSOP(pmp, ACCESS))
675 return 0;
676
677 access_arg.pvnr_mode = ap->a_mode;
678 access_arg.pvnr_pid = puffs_lwp2pid(ap->a_l);
679 puffs_credcvt(&access_arg.pvnr_cred, ap->a_cred);
680
681 return puffs_vntouser(MPTOPUFFSMP(vp->v_mount), PUFFS_VN_ACCESS,
682 &access_arg, sizeof(access_arg), 0, vp, NULL);
683 }
684
685 int
686 puffs_getattr(void *v)
687 {
688 struct vop_getattr_args /* {
689 const struct vnodeop_desc *a_desc;
690 struct vnode *a_vp;
691 struct vattr *a_vap;
692 kauth_cred_t a_cred;
693 struct lwp *a_l;
694 } */ *ap = v;
695 struct mount *mp;
696 struct vnode *vp;
697 struct vattr *vap, *rvap;
698 struct puffs_node *pn;
699 int error;
700
701 PUFFS_VNREQ(getattr);
702
703 vp = ap->a_vp;
704 mp = vp->v_mount;
705 vap = ap->a_vap;
706
707 vattr_null(&getattr_arg.pvnr_va);
708 puffs_credcvt(&getattr_arg.pvnr_cred, ap->a_cred);
709 getattr_arg.pvnr_pid = puffs_lwp2pid(ap->a_l);
710
711 error = puffs_vntouser(MPTOPUFFSMP(vp->v_mount), PUFFS_VN_GETATTR,
712 &getattr_arg, sizeof(getattr_arg), 0, vp, NULL);
713 if (error)
714 return error;
715
716 rvap = &getattr_arg.pvnr_va;
717 /*
718 * Don't listen to the file server regarding special device
719 * size info, the file server doesn't know anything about them.
720 */
721 if (vp->v_type == VBLK || vp->v_type == VCHR)
722 rvap->va_size = vp->v_size;
723
724 /* Ditto for blocksize (ufs comment: this doesn't belong here) */
725 if (vp->v_type == VBLK)
726 rvap->va_blocksize = BLKDEV_IOSIZE;
727 else if (vp->v_type == VCHR)
728 rvap->va_blocksize = MAXBSIZE;
729
730 (void) memcpy(vap, rvap, sizeof(struct vattr));
731 vap->va_fsid = mp->mnt_stat.f_fsidx.__fsid_val[0];
732
733 pn = VPTOPP(vp);
734 if (pn->pn_stat & PNODE_METACACHE_ATIME)
735 vap->va_atime = pn->pn_mc_atime;
736 if (pn->pn_stat & PNODE_METACACHE_CTIME)
737 vap->va_ctime = pn->pn_mc_ctime;
738 if (pn->pn_stat & PNODE_METACACHE_MTIME)
739 vap->va_mtime = pn->pn_mc_mtime;
740 if (pn->pn_stat & PNODE_METACACHE_SIZE) {
741 vap->va_size = pn->pn_mc_size;
742 } else {
743 if (rvap->va_size != VNOVAL
744 && vp->v_type != VBLK && vp->v_type != VCHR)
745 uvm_vnp_setsize(vp, rvap->va_size);
746 }
747
748 return 0;
749 }
750
751 int
752 puffs_setattr(void *v)
753 {
754 struct vop_getattr_args /* {
755 const struct vnodeop_desc *a_desc;
756 struct vnode *a_vp;
757 struct vattr *a_vap;
758 kauth_cred_t a_cred;
759 struct lwp *a_l;
760 } */ *ap = v;
761 int error;
762 struct vattr *vap = ap->a_vap;
763 struct puffs_node *pn = ap->a_vp->v_data;
764
765 PUFFS_VNREQ(setattr);
766
767 /*
768 * Flush metacache first. If we are called with some explicit
769 * parameters, treat them as information overriding metacache
770 * information.
771 */
772 if (pn->pn_stat & PNODE_METACACHE_MASK) {
773 if ((pn->pn_stat & PNODE_METACACHE_ATIME)
774 && vap->va_atime.tv_sec == VNOVAL)
775 vap->va_atime = pn->pn_mc_atime;
776 if ((pn->pn_stat & PNODE_METACACHE_CTIME)
777 && vap->va_ctime.tv_sec == VNOVAL)
778 vap->va_ctime = pn->pn_mc_ctime;
779 if ((pn->pn_stat & PNODE_METACACHE_MTIME)
780 && vap->va_mtime.tv_sec == VNOVAL)
781 vap->va_mtime = pn->pn_mc_mtime;
782 if ((pn->pn_stat & PNODE_METACACHE_SIZE)
783 && vap->va_size == VNOVAL)
784 vap->va_size = pn->pn_mc_size;
785
786 pn->pn_stat &= ~PNODE_METACACHE_MASK;
787 }
788
789 (void)memcpy(&setattr_arg.pvnr_va, vap, sizeof(struct vattr));
790 puffs_credcvt(&setattr_arg.pvnr_cred, ap->a_cred);
791 setattr_arg.pvnr_pid = puffs_lwp2pid(ap->a_l);
792
793 error = puffs_vntouser(MPTOPUFFSMP(ap->a_vp->v_mount), PUFFS_VN_SETATTR,
794 &setattr_arg, sizeof(setattr_arg), 0, ap->a_vp, NULL);
795 if (error)
796 return error;
797
798 if (vap->va_size != VNOVAL)
799 uvm_vnp_setsize(ap->a_vp, vap->va_size);
800
801 return 0;
802 }
803
804 int
805 puffs_inactive(void *v)
806 {
807 struct vop_inactive_args /* {
808 const struct vnodeop_desc *a_desc;
809 struct vnode *a_vp;
810 struct lwp *a_l;
811 } */ *ap = v;
812 struct puffs_mount *pmp;
813 struct puffs_node *pnode;
814 int rv, vnrefs, call;
815
816 PUFFS_VNREQ(inactive);
817
818 /*
819 * XXX: think about this after we really start unlocking
820 * when going to userspace
821 */
822 pnode = ap->a_vp->v_data;
823
824 pmp = MPTOPUFFSMP(ap->a_vp->v_mount);
825
826 inactive_arg.pvnr_pid = puffs_lwp2pid(ap->a_l);
827
828 if (EXISTSOP(pmp, INACTIVE))
829 if (pmp->pmp_flags & PUFFS_KFLAG_IAONDEMAND)
830 if ((pnode->pn_stat & PNODE_DOINACT) || ALLOPS(pmp))
831 call = 1;
832 else
833 call = 0;
834 else
835 call = 1;
836 else
837 call = 0;
838
839 if (call)
840 rv = puffs_vntouser(pmp, PUFFS_VN_INACTIVE,
841 &inactive_arg, sizeof(inactive_arg), 0, ap->a_vp, NULL);
842 else
843 rv = 1; /* see below */
844 pnode->pn_stat &= ~PNODE_DOINACT;
845
846 /* can't trust userspace return value? simulate safe answer */
847 if (rv)
848 vnrefs = 1;
849 else
850 vnrefs = inactive_arg.pvnr_backendrefs;
851
852 VOP_UNLOCK(ap->a_vp, 0);
853
854 /*
855 * user server thinks it's gone? then don't be afraid care,
856 * node's life was already all it would ever be
857 */
858 if (vnrefs == 0 || (pnode->pn_stat & PNODE_NOREFS)) {
859 pnode->pn_stat |= PNODE_DYING;
860 vrecycle(ap->a_vp, NULL, ap->a_l);
861 }
862
863 return 0;
864 }
865
866 /*
867 * always FAF, we don't really care if the server wants to fail to
868 * reclaim the node or not
869 */
870 int
871 puffs_reclaim(void *v)
872 {
873 struct vop_reclaim_args /* {
874 const struct vnodeop_desc *a_desc;
875 struct vnode *a_vp;
876 struct lwp *a_l;
877 } */ *ap = v;
878 struct puffs_mount *pmp;
879 struct puffs_vnreq_reclaim *reclaim_argp;
880
881 pmp = MPTOPUFFSMP(ap->a_vp->v_mount);
882
883 /*
884 * first things first: check if someone is trying to reclaim the
885 * root vnode. do not allow that to travel to userspace.
886 * Note that we don't need to take the lock similarly to
887 * puffs_root(), since there is only one of us.
888 */
889 if (ap->a_vp->v_flag & VROOT) {
890 mutex_enter(&pmp->pmp_lock);
891 KASSERT(pmp->pmp_root != NULL);
892 pmp->pmp_root = NULL;
893 mutex_exit(&pmp->pmp_lock);
894 goto out;
895 }
896
897 if (!EXISTSOP(pmp, RECLAIM))
898 goto out;
899
900 reclaim_argp = malloc(sizeof(struct puffs_vnreq_reclaim),
901 M_PUFFS, M_WAITOK | M_ZERO);
902 reclaim_argp->pvnr_pid = puffs_lwp2pid(ap->a_l);
903
904 puffs_vntouser_faf(pmp, PUFFS_VN_RECLAIM,
905 reclaim_argp, sizeof(struct puffs_vnreq_reclaim), ap->a_vp);
906
907 out:
908 if (PUFFS_DOCACHE(pmp))
909 cache_purge(ap->a_vp);
910 puffs_putvnode(ap->a_vp);
911
912 return 0;
913 }
914
915 #define CSIZE sizeof(**ap->a_cookies)
916 int
917 puffs_readdir(void *v)
918 {
919 struct vop_readdir_args /* {
920 const struct vnodeop_desc *a_desc;
921 struct vnode *a_vp;
922 struct uio *a_uio;
923 kauth_cred_t a_cred;
924 int *a_eofflag;
925 off_t **a_cookies;
926 int *a_ncookies;
927 } */ *ap = v;
928 struct puffs_mount *pmp = MPTOPUFFSMP(ap->a_vp->v_mount);
929 struct puffs_vnreq_readdir *readdir_argp;
930 size_t argsize, tomove, cookiemem, cookiesmax;
931 struct uio *uio = ap->a_uio;
932 size_t howmuch;
933 int error;
934
935 if (ap->a_cookies) {
936 KASSERT(ap->a_ncookies != NULL);
937 if (pmp->pmp_args.pa_fhsize == 0)
938 return EOPNOTSUPP;
939 cookiesmax = uio->uio_resid/_DIRENT_MINSIZE((struct dirent *)0);
940 cookiemem = ALIGN(cookiesmax*CSIZE); /* play safe */
941 } else {
942 cookiesmax = 0;
943 cookiemem = 0;
944 }
945
946 argsize = sizeof(struct puffs_vnreq_readdir);
947 tomove = uio->uio_resid + cookiemem;
948 readdir_argp = malloc(argsize + tomove, M_PUFFS, M_ZERO | M_WAITOK);
949
950 puffs_credcvt(&readdir_argp->pvnr_cred, ap->a_cred);
951 readdir_argp->pvnr_offset = uio->uio_offset;
952 readdir_argp->pvnr_resid = uio->uio_resid;
953 readdir_argp->pvnr_ncookies = cookiesmax;
954 readdir_argp->pvnr_eofflag = 0;
955 readdir_argp->pvnr_dentoff = cookiemem;
956
957 error = puffs_vntouser(MPTOPUFFSMP(ap->a_vp->v_mount),
958 PUFFS_VN_READDIR, readdir_argp, argsize, tomove,
959 ap->a_vp, NULL);
960 if (error)
961 goto out;
962
963 /* userspace is cheating? */
964 if (readdir_argp->pvnr_resid > uio->uio_resid
965 || readdir_argp->pvnr_ncookies > cookiesmax) {
966 error = EINVAL;
967 goto out;
968 }
969
970 /* check eof */
971 if (readdir_argp->pvnr_eofflag)
972 *ap->a_eofflag = 1;
973
974 /* bouncy-wouncy with the directory data */
975 howmuch = uio->uio_resid - readdir_argp->pvnr_resid;
976
977 /* force eof if no data was returned (getcwd() needs this) */
978 if (howmuch == 0) {
979 *ap->a_eofflag = 1;
980 goto out;
981 }
982
983 error = uiomove(readdir_argp->pvnr_data + cookiemem, howmuch, uio);
984 if (error)
985 goto out;
986
987 /* provide cookies to caller if so desired */
988 if (ap->a_cookies) {
989 *ap->a_cookies = malloc(readdir_argp->pvnr_ncookies*CSIZE,
990 M_TEMP, M_WAITOK);
991 *ap->a_ncookies = readdir_argp->pvnr_ncookies;
992 memcpy(*ap->a_cookies, readdir_argp->pvnr_data,
993 *ap->a_ncookies*CSIZE);
994 }
995
996 /* next readdir starts here */
997 uio->uio_offset = readdir_argp->pvnr_offset;
998
999 out:
1000 free(readdir_argp, M_PUFFS);
1001 return error;
1002 }
1003 #undef CSIZE
1004
1005 /*
1006 * poll works by consuming the bitmask in pn_revents. If there are
1007 * events available, poll returns immediately. If not, it issues a
1008 * poll to userspace, selrecords itself and returns with no available
1009 * events. When the file server returns, it executes puffs_parkdone_poll(),
1010 * where available events are added to the bitmask. selnotify() is
1011 * then also executed by that function causing us to enter here again
1012 * and hopefully find the missing bits (unless someone got them first,
1013 * in which case it starts all over again).
1014 */
1015 int
1016 puffs_poll(void *v)
1017 {
1018 struct vop_poll_args /* {
1019 const struct vnodeop_desc *a_desc;
1020 struct vnode *a_vp;
1021 int a_events;
1022 struct lwp *a_l;
1023 }*/ *ap = v;
1024 struct vnode *vp = ap->a_vp;
1025 struct puffs_mount *pmp = MPTOPUFFSMP(vp->v_mount);
1026 struct puffs_vnreq_poll *poll_argp;
1027 struct puffs_node *pn = vp->v_data;
1028 int events;
1029
1030 if (EXISTSOP(pmp, POLL)) {
1031 mutex_enter(&pn->pn_mtx);
1032 events = pn->pn_revents & ap->a_events;
1033 if (events & ap->a_events) {
1034 pn->pn_revents &= ~ap->a_events;
1035 mutex_exit(&pn->pn_mtx);
1036
1037 return events;
1038 } else {
1039 puffs_referencenode(pn);
1040 mutex_exit(&pn->pn_mtx);
1041
1042 /* freed in puffs_parkdone_poll */
1043 poll_argp = malloc(sizeof(struct puffs_vnreq_poll),
1044 M_PUFFS, M_ZERO | M_WAITOK);
1045
1046 poll_argp->pvnr_events = ap->a_events;
1047 poll_argp->pvnr_pid = puffs_lwp2pid(ap->a_l);
1048
1049 selrecord(ap->a_l, &pn->pn_sel);
1050 puffs_vntouser_call(pmp, PUFFS_VN_POLL,
1051 poll_argp, sizeof(struct puffs_vnreq_poll), 0,
1052 puffs_parkdone_poll, pn,
1053 vp, NULL);
1054
1055 return 0;
1056 }
1057 } else {
1058 return genfs_poll(v);
1059 }
1060 }
1061
1062 int
1063 puffs_fsync(void *v)
1064 {
1065 struct vop_fsync_args /* {
1066 const struct vnodeop_desc *a_desc;
1067 struct vnode *a_vp;
1068 kauth_cred_t a_cred;
1069 int a_flags;
1070 off_t a_offlo;
1071 off_t a_offhi;
1072 struct lwp *a_l;
1073 } */ *ap = v;
1074 struct vattr va;
1075 struct puffs_mount *pmp;
1076 struct puffs_vnreq_fsync *fsync_argp;
1077 struct vnode *vp;
1078 struct puffs_node *pn;
1079 int pflags, error, dofaf;
1080
1081 PUFFS_VNREQ(fsync);
1082
1083 vp = ap->a_vp;
1084 pn = VPTOPP(vp);
1085 pmp = MPTOPUFFSMP(vp->v_mount);
1086
1087 /* flush out information from our metacache, see vop_setattr */
1088 if (pn->pn_stat & PNODE_METACACHE_MASK
1089 && (pn->pn_stat & PNODE_DYING) == 0) {
1090 vattr_null(&va);
1091 error = VOP_SETATTR(vp, &va, FSCRED, NULL);
1092 if (error)
1093 return error;
1094 }
1095
1096 /*
1097 * flush pages to avoid being overly dirty
1098 */
1099 pflags = PGO_CLEANIT;
1100 if (ap->a_flags & FSYNC_WAIT)
1101 pflags |= PGO_SYNCIO;
1102 simple_lock(&vp->v_interlock);
1103 error = VOP_PUTPAGES(vp, trunc_page(ap->a_offlo),
1104 round_page(ap->a_offhi), pflags);
1105 if (error)
1106 return error;
1107
1108 /*
1109 * HELLO! We exit already here if the user server does not
1110 * support fsync OR if we should call fsync for a node which
1111 * has references neither in the kernel or the fs server.
1112 * Otherwise we continue to issue fsync() forward.
1113 */
1114 if (!EXISTSOP(pmp, FSYNC) || (pn->pn_stat & PNODE_DYING))
1115 return 0;
1116
1117 dofaf = (ap->a_flags & FSYNC_WAIT) == 0 || ap->a_flags == FSYNC_LAZY;
1118 /*
1119 * We abuse VXLOCK to mean "vnode is going to die", so we issue
1120 * only FAFs for those. Otherwise there's a danger of deadlock,
1121 * since the execution context here might be the user server
1122 * doing some operation on another fs, which in turn caused a
1123 * vnode to be reclaimed from the freelist for this fs.
1124 */
1125 if (dofaf == 0) {
1126 simple_lock(&vp->v_interlock);
1127 if (vp->v_flag & VXLOCK)
1128 dofaf = 1;
1129 simple_unlock(&vp->v_interlock);
1130 }
1131
1132 if (dofaf == 0) {
1133 fsync_argp = &fsync_arg;
1134 } else {
1135 fsync_argp = malloc(sizeof(struct puffs_vnreq_fsync),
1136 M_PUFFS, M_ZERO | M_NOWAIT);
1137 if (fsync_argp == NULL)
1138 return ENOMEM;
1139 }
1140
1141 puffs_credcvt(&fsync_argp->pvnr_cred, ap->a_cred);
1142 fsync_argp->pvnr_flags = ap->a_flags;
1143 fsync_argp->pvnr_offlo = ap->a_offlo;
1144 fsync_argp->pvnr_offhi = ap->a_offhi;
1145 fsync_argp->pvnr_pid = puffs_lwp2pid(ap->a_l);
1146
1147 /*
1148 * XXX: see comment at puffs_getattr about locking
1149 *
1150 * If we are not required to wait, do a FAF operation.
1151 * Otherwise block here.
1152 */
1153 if (dofaf == 0) {
1154 error = puffs_vntouser(MPTOPUFFSMP(vp->v_mount),
1155 PUFFS_VN_FSYNC, fsync_argp, sizeof(*fsync_argp), 0,
1156 vp, NULL);
1157 } else {
1158 /* FAF is always "succesful" */
1159 error = 0;
1160 puffs_vntouser_faf(MPTOPUFFSMP(vp->v_mount),
1161 PUFFS_VN_FSYNC, fsync_argp, sizeof(*fsync_argp), vp);
1162 }
1163
1164 return error;
1165 }
1166
1167 int
1168 puffs_seek(void *v)
1169 {
1170 struct vop_seek_args /* {
1171 const struct vnodeop_desc *a_desc;
1172 struct vnode *a_vp;
1173 off_t a_oldoff;
1174 off_t a_newoff;
1175 kauth_cred_t a_cred;
1176 } */ *ap = v;
1177
1178 PUFFS_VNREQ(seek);
1179
1180 seek_arg.pvnr_oldoff = ap->a_oldoff;
1181 seek_arg.pvnr_newoff = ap->a_newoff;
1182 puffs_credcvt(&seek_arg.pvnr_cred, ap->a_cred);
1183
1184 /*
1185 * XXX: seems like seek is called with an unlocked vp, but
1186 * it can't hurt to play safe
1187 */
1188 return puffs_vntouser(MPTOPUFFSMP(ap->a_vp->v_mount), PUFFS_VN_SEEK,
1189 &seek_arg, sizeof(seek_arg), 0, ap->a_vp, NULL);
1190 }
1191
1192 int
1193 puffs_remove(void *v)
1194 {
1195 struct vop_remove_args /* {
1196 const struct vnodeop_desc *a_desc;
1197 struct vnode *a_dvp;
1198 struct vnode *a_vp;
1199 struct componentname *a_cnp;
1200 } */ *ap = v;
1201 int error;
1202
1203 PUFFS_VNREQ(remove);
1204
1205 remove_arg.pvnr_cookie_targ = VPTOPNC(ap->a_vp);
1206 puffs_makecn(&remove_arg.pvnr_cn, ap->a_cnp);
1207
1208 error = puffs_vntouser(MPTOPUFFSMP(ap->a_vp->v_mount), PUFFS_VN_REMOVE,
1209 &remove_arg, sizeof(remove_arg), 0, ap->a_dvp, ap->a_vp);
1210
1211 vput(ap->a_vp);
1212 if (ap->a_dvp == ap->a_vp)
1213 vrele(ap->a_dvp);
1214 else
1215 vput(ap->a_dvp);
1216
1217 return error;
1218 }
1219
1220 int
1221 puffs_mkdir(void *v)
1222 {
1223 struct vop_mkdir_args /* {
1224 const struct vnodeop_desc *a_desc;
1225 struct vnode *a_dvp;
1226 struct vnode **a_vpp;
1227 struct componentname *a_cnp;
1228 struct vattr *a_vap;
1229 } */ *ap = v;
1230 int error;
1231
1232 PUFFS_VNREQ(mkdir);
1233
1234 puffs_makecn(&mkdir_arg.pvnr_cn, ap->a_cnp);
1235 mkdir_arg.pvnr_va = *ap->a_vap;
1236
1237 error = puffs_vntouser(MPTOPUFFSMP(ap->a_dvp->v_mount), PUFFS_VN_MKDIR,
1238 &mkdir_arg, sizeof(mkdir_arg), 0, ap->a_dvp, NULL);
1239 if (error)
1240 goto out;
1241
1242 error = puffs_newnode(ap->a_dvp->v_mount, ap->a_dvp, ap->a_vpp,
1243 mkdir_arg.pvnr_newnode, ap->a_cnp, VDIR, 0);
1244
1245 out:
1246 if (error || (ap->a_cnp->cn_flags & SAVESTART) == 0)
1247 PNBUF_PUT(ap->a_cnp->cn_pnbuf);
1248 vput(ap->a_dvp);
1249 return error;
1250 }
1251
1252 int
1253 puffs_rmdir(void *v)
1254 {
1255 struct vop_rmdir_args /* {
1256 const struct vnodeop_desc *a_desc;
1257 struct vnode *a_dvp;
1258 struct vnode *a_vp;
1259 struct componentname *a_cnp;
1260 } */ *ap = v;
1261 int error;
1262
1263 PUFFS_VNREQ(rmdir);
1264
1265 rmdir_arg.pvnr_cookie_targ = VPTOPNC(ap->a_vp);
1266 puffs_makecn(&rmdir_arg.pvnr_cn, ap->a_cnp);
1267
1268 error = puffs_vntouser(MPTOPUFFSMP(ap->a_dvp->v_mount), PUFFS_VN_RMDIR,
1269 &rmdir_arg, sizeof(rmdir_arg), 0, ap->a_dvp, ap->a_vp);
1270
1271 /* XXX: some call cache_purge() *for both vnodes* here, investigate */
1272
1273 vput(ap->a_dvp);
1274 vput(ap->a_vp);
1275
1276 return error;
1277 }
1278
1279 int
1280 puffs_link(void *v)
1281 {
1282 struct vop_link_args /* {
1283 const struct vnodeop_desc *a_desc;
1284 struct vnode *a_dvp;
1285 struct vnode *a_vp;
1286 struct componentname *a_cnp;
1287 }*/ *ap = v;
1288 int error;
1289
1290 PUFFS_VNREQ(link);
1291
1292 link_arg.pvnr_cookie_targ = VPTOPNC(ap->a_vp);
1293 puffs_makecn(&link_arg.pvnr_cn, ap->a_cnp);
1294
1295 error = puffs_vntouser(MPTOPUFFSMP(ap->a_dvp->v_mount), PUFFS_VN_LINK,
1296 &link_arg, sizeof(link_arg), 0, ap->a_dvp, ap->a_vp);
1297
1298 /*
1299 * XXX: stay in touch with the cache. I don't like this, but
1300 * don't have a better solution either. See also puffs_rename().
1301 */
1302 if (error == 0)
1303 puffs_updatenode(ap->a_vp, PUFFS_UPDATECTIME);
1304
1305 vput(ap->a_dvp);
1306
1307 return error;
1308 }
1309
1310 int
1311 puffs_symlink(void *v)
1312 {
1313 struct vop_symlink_args /* {
1314 const struct vnodeop_desc *a_desc;
1315 struct vnode *a_dvp;
1316 struct vnode **a_vpp;
1317 struct componentname *a_cnp;
1318 struct vattr *a_vap;
1319 char *a_target;
1320 }*/ *ap = v;
1321 int error;
1322
1323 PUFFS_VNREQ(symlink); /* XXX: large structure */
1324
1325 *ap->a_vpp = NULL;
1326
1327 puffs_makecn(&symlink_arg.pvnr_cn, ap->a_cnp);
1328 symlink_arg.pvnr_va = *ap->a_vap;
1329 (void)strlcpy(symlink_arg.pvnr_link, ap->a_target,
1330 sizeof(symlink_arg.pvnr_link));
1331
1332 error = puffs_vntouser(MPTOPUFFSMP(ap->a_dvp->v_mount),
1333 PUFFS_VN_SYMLINK, &symlink_arg, sizeof(symlink_arg), 0,
1334 ap->a_dvp, NULL);
1335 if (error)
1336 goto out;
1337
1338 error = puffs_newnode(ap->a_dvp->v_mount, ap->a_dvp, ap->a_vpp,
1339 symlink_arg.pvnr_newnode, ap->a_cnp, VLNK, 0);
1340
1341 out:
1342 if (error || (ap->a_cnp->cn_flags & SAVESTART) == 0)
1343 PNBUF_PUT(ap->a_cnp->cn_pnbuf);
1344 vput(ap->a_dvp);
1345 return error;
1346 }
1347
1348 int
1349 puffs_readlink(void *v)
1350 {
1351 struct vop_readlink_args /* {
1352 const struct vnodeop_desc *a_desc;
1353 struct vnode *a_vp;
1354 struct uio *a_uio;
1355 kauth_cred_t a_cred;
1356 } */ *ap = v;
1357 size_t linklen;
1358 int error;
1359
1360 PUFFS_VNREQ(readlink);
1361
1362 puffs_credcvt(&readlink_arg.pvnr_cred, ap->a_cred);
1363 linklen = sizeof(readlink_arg.pvnr_link);
1364 readlink_arg.pvnr_linklen = linklen;
1365
1366 error = puffs_vntouser(MPTOPUFFSMP(ap->a_vp->v_mount),
1367 PUFFS_VN_READLINK, &readlink_arg, sizeof(readlink_arg), 0,
1368 ap->a_vp, NULL);
1369 if (error)
1370 return error;
1371
1372 /* bad bad user file server */
1373 if (readlink_arg.pvnr_linklen > linklen)
1374 return EINVAL;
1375
1376 return uiomove(&readlink_arg.pvnr_link, readlink_arg.pvnr_linklen,
1377 ap->a_uio);
1378 }
1379
1380 /* XXXXXXX: think about locking & userspace op delocking... */
1381 int
1382 puffs_rename(void *v)
1383 {
1384 struct vop_rename_args /* {
1385 const struct vnodeop_desc *a_desc;
1386 struct vnode *a_fdvp;
1387 struct vnode *a_fvp;
1388 struct componentname *a_fcnp;
1389 struct vnode *a_tdvp;
1390 struct vnode *a_tvp;
1391 struct componentname *a_tcnp;
1392 }*/ *ap = v;
1393 int error;
1394
1395 PUFFS_VNREQ(rename);
1396
1397 if (ap->a_fvp->v_mount != ap->a_tdvp->v_mount) {
1398 error = EXDEV;
1399 goto out;
1400 }
1401
1402 rename_arg.pvnr_cookie_src = VPTOPNC(ap->a_fvp);
1403 rename_arg.pvnr_cookie_targdir = VPTOPNC(ap->a_tdvp);
1404 if (ap->a_tvp)
1405 rename_arg.pvnr_cookie_targ = VPTOPNC(ap->a_tvp);
1406 else
1407 rename_arg.pvnr_cookie_targ = NULL;
1408 puffs_makecn(&rename_arg.pvnr_cn_src, ap->a_fcnp);
1409 puffs_makecn(&rename_arg.pvnr_cn_targ, ap->a_tcnp);
1410
1411 error = puffs_vntouser(MPTOPUFFSMP(ap->a_fdvp->v_mount),
1412 PUFFS_VN_RENAME, &rename_arg, sizeof(rename_arg), 0,
1413 ap->a_fdvp, NULL); /* XXX */
1414
1415 /*
1416 * XXX: stay in touch with the cache. I don't like this, but
1417 * don't have a better solution either. See also puffs_link().
1418 */
1419 if (error == 0)
1420 puffs_updatenode(ap->a_fvp, PUFFS_UPDATECTIME);
1421
1422 out:
1423 if (ap->a_tvp != NULL)
1424 vput(ap->a_tvp);
1425 if (ap->a_tdvp == ap->a_tvp)
1426 vrele(ap->a_tdvp);
1427 else
1428 vput(ap->a_tdvp);
1429
1430 vrele(ap->a_fdvp);
1431 vrele(ap->a_fvp);
1432
1433 return error;
1434 }
1435
1436 int
1437 puffs_read(void *v)
1438 {
1439 struct vop_read_args /* {
1440 const struct vnodeop_desc *a_desc;
1441 struct vnode *a_vp;
1442 struct uio *a_uio;
1443 int a_ioflag;
1444 kauth_cred_t a_cred;
1445 } */ *ap = v;
1446 struct puffs_vnreq_read *read_argp;
1447 struct puffs_mount *pmp;
1448 struct vnode *vp;
1449 struct uio *uio;
1450 void *win;
1451 size_t tomove, argsize;
1452 vsize_t bytelen;
1453 int error, ubcflags;
1454
1455 uio = ap->a_uio;
1456 vp = ap->a_vp;
1457 read_argp = NULL;
1458 error = 0;
1459 pmp = MPTOPUFFSMP(vp->v_mount);
1460
1461 /* std sanity */
1462 if (uio->uio_resid == 0)
1463 return 0;
1464 if (uio->uio_offset < 0)
1465 return EINVAL;
1466
1467 if (vp->v_type == VREG && PUFFS_DOCACHE(pmp)) {
1468 const int advice = IO_ADV_DECODE(ap->a_ioflag);
1469
1470 ubcflags = 0;
1471 if (UBC_WANT_UNMAP(vp))
1472 ubcflags = UBC_UNMAP;
1473
1474 while (uio->uio_resid > 0) {
1475 bytelen = MIN(uio->uio_resid,
1476 vp->v_size - uio->uio_offset);
1477 if (bytelen == 0)
1478 break;
1479
1480 win = ubc_alloc(&vp->v_uobj, uio->uio_offset,
1481 &bytelen, advice, UBC_READ);
1482 error = uiomove(win, bytelen, uio);
1483 ubc_release(win, ubcflags);
1484 if (error)
1485 break;
1486 }
1487
1488 if ((vp->v_mount->mnt_flag & MNT_NOATIME) == 0)
1489 puffs_updatenode(vp, PUFFS_UPDATEATIME);
1490 } else {
1491 /*
1492 * in case it's not a regular file or we're operating
1493 * uncached, do read in the old-fashioned style,
1494 * i.e. explicit read operations
1495 */
1496
1497 tomove = PUFFS_TOMOVE(uio->uio_resid, pmp);
1498 argsize = sizeof(struct puffs_vnreq_read);
1499 read_argp = malloc(argsize + tomove,
1500 M_PUFFS, M_WAITOK | M_ZERO);
1501
1502 error = 0;
1503 while (uio->uio_resid > 0) {
1504 read_argp->pvnr_ioflag = ap->a_ioflag;
1505 read_argp->pvnr_resid = tomove;
1506 read_argp->pvnr_offset = uio->uio_offset;
1507 puffs_credcvt(&read_argp->pvnr_cred, ap->a_cred);
1508
1509 argsize = sizeof(struct puffs_vnreq_read);
1510 error = puffs_vntouser(pmp, PUFFS_VN_READ,
1511 read_argp, argsize, tomove,
1512 ap->a_vp, NULL);
1513 if (error)
1514 break;
1515
1516 if (read_argp->pvnr_resid > tomove) {
1517 error = EINVAL;
1518 break;
1519 }
1520
1521 error = uiomove(read_argp->pvnr_data,
1522 tomove - read_argp->pvnr_resid, uio);
1523
1524 /*
1525 * in case the file is out of juice, resid from
1526 * userspace is != 0. and the error-case is
1527 * quite obvious
1528 */
1529 if (error || read_argp->pvnr_resid)
1530 break;
1531
1532 tomove = PUFFS_TOMOVE(uio->uio_resid, pmp);
1533 }
1534 }
1535
1536 if (read_argp)
1537 free(read_argp, M_PUFFS);
1538 return error;
1539 }
1540
1541 int
1542 puffs_write(void *v)
1543 {
1544 struct vop_write_args /* {
1545 const struct vnodeop_desc *a_desc;
1546 struct vnode *a_vp;
1547 struct uio *a_uio;
1548 int a_ioflag;
1549 kauth_cred_t a_cred;
1550 } */ *ap = v;
1551 struct puffs_vnreq_write *write_argp;
1552 struct puffs_mount *pmp;
1553 struct uio *uio;
1554 struct vnode *vp;
1555 void *win;
1556 size_t tomove, argsize;
1557 off_t oldoff, newoff, origoff;
1558 vsize_t bytelen;
1559 int error, uflags;
1560 int ubcflags;
1561
1562 vp = ap->a_vp;
1563 uio = ap->a_uio;
1564 error = uflags = 0;
1565 write_argp = NULL;
1566 pmp = MPTOPUFFSMP(ap->a_vp->v_mount);
1567
1568 if (vp->v_type == VREG && PUFFS_DOCACHE(pmp)) {
1569 ubcflags = 0;
1570 if (UBC_WANT_UNMAP(vp))
1571 ubcflags = UBC_UNMAP;
1572
1573 /*
1574 * userspace *should* be allowed to control this,
1575 * but with UBC it's a bit unclear how to handle it
1576 */
1577 if (ap->a_ioflag & IO_APPEND)
1578 uio->uio_offset = vp->v_size;
1579
1580 origoff = uio->uio_offset;
1581 while (uio->uio_resid > 0) {
1582 uflags |= PUFFS_UPDATECTIME;
1583 uflags |= PUFFS_UPDATEMTIME;
1584 oldoff = uio->uio_offset;
1585 bytelen = uio->uio_resid;
1586
1587 win = ubc_alloc(&vp->v_uobj, oldoff, &bytelen,
1588 UVM_ADV_NORMAL, UBC_WRITE);
1589 error = uiomove(win, bytelen, uio);
1590
1591 /*
1592 * There is no guarantee that the faults
1593 * generated by uiomove() succeed at all.
1594 * Therefore, in case of an uiomove() error,
1595 * opt to not extend the file at all and
1596 * return an error. Otherwise, if we attempt
1597 * to clear the memory we couldn't fault to,
1598 * we might generate a kernel page fault.
1599 */
1600 newoff = oldoff + bytelen;
1601 if (vp->v_size < newoff && error == 0) {
1602 uflags |= PUFFS_UPDATESIZE;
1603 uvm_vnp_setsize(vp, newoff);
1604 }
1605
1606 ubc_release(win, ubcflags);
1607 if (error)
1608 break;
1609
1610 /*
1611 * If we're writing large files, flush to file server
1612 * every 64k. Otherwise we can very easily exhaust
1613 * kernel and user memory, as the file server cannot
1614 * really keep up with our writing speed.
1615 *
1616 * Note: this does *NOT* honor MNT_ASYNC, because
1617 * that gives userland too much say in the kernel.
1618 */
1619 if (oldoff >> 16 != uio->uio_offset >> 16) {
1620 simple_lock(&vp->v_interlock);
1621 error = VOP_PUTPAGES(vp, oldoff & ~0xffff,
1622 uio->uio_offset & ~0xffff,
1623 PGO_CLEANIT | PGO_SYNCIO);
1624 if (error)
1625 break;
1626 }
1627 }
1628
1629 /* synchronous I/O? */
1630 if (error == 0 && ap->a_ioflag & IO_SYNC) {
1631 simple_lock(&vp->v_interlock);
1632 error = VOP_PUTPAGES(vp, trunc_page(origoff),
1633 round_page(uio->uio_offset),
1634 PGO_CLEANIT | PGO_SYNCIO);
1635
1636 /* write though page cache? */
1637 } else if (error == 0 && pmp->pmp_flags & PUFFS_KFLAG_WTCACHE) {
1638 simple_lock(&vp->v_interlock);
1639 error = VOP_PUTPAGES(vp, trunc_page(origoff),
1640 round_page(uio->uio_offset), PGO_CLEANIT);
1641 }
1642
1643 puffs_updatenode(vp, uflags);
1644 } else {
1645 /* tomove is non-increasing */
1646 tomove = PUFFS_TOMOVE(uio->uio_resid, pmp);
1647 argsize = sizeof(struct puffs_vnreq_write) + tomove;
1648 write_argp = malloc(argsize, M_PUFFS, M_WAITOK | M_ZERO);
1649
1650 while (uio->uio_resid > 0) {
1651 write_argp->pvnr_ioflag = ap->a_ioflag;
1652 write_argp->pvnr_resid = tomove;
1653 write_argp->pvnr_offset = uio->uio_offset;
1654 puffs_credcvt(&write_argp->pvnr_cred, ap->a_cred);
1655 error = uiomove(write_argp->pvnr_data, tomove, uio);
1656 if (error)
1657 break;
1658
1659 error = puffs_vntouser(MPTOPUFFSMP(ap->a_vp->v_mount),
1660 PUFFS_VN_WRITE, write_argp, argsize, 0,
1661 ap->a_vp, NULL);
1662 if (error) {
1663 /* restore uiomove */
1664 uio->uio_resid += tomove;
1665 uio->uio_offset -= tomove;
1666 break;
1667 }
1668 if (write_argp->pvnr_resid > tomove) {
1669 /*
1670 * XXX: correct file size is a mystery,
1671 * we can only guess
1672 */
1673 error = EINVAL;
1674 break;
1675 }
1676
1677 /* adjust file size */
1678 if (vp->v_size < uio->uio_offset)
1679 uvm_vnp_setsize(vp, uio->uio_offset);
1680
1681 /* didn't move everything? bad userspace. bail */
1682 if (write_argp->pvnr_resid != 0) {
1683 uio->uio_resid += write_argp->pvnr_resid;
1684 uio->uio_offset -= write_argp->pvnr_resid;
1685 error = EIO;
1686 break;
1687 }
1688
1689 tomove = PUFFS_TOMOVE(uio->uio_resid, pmp);
1690 }
1691 }
1692
1693 if (write_argp)
1694 free(write_argp, M_PUFFS);
1695 return error;
1696 }
1697
static int puffs_fcnioctl(struct vop_ioctl_args * /*XXX*/, int);

/*
 * Upper bound for ioctl/fcntl argument data.  Parenthesized so that
 * the shift cannot be torn apart by neighbouring operators when the
 * macro is used inside a larger expression.
 */
#define FCNIOCTL_ARG_MAX (1<<16)

/*
 * Common backend for puffs_ioctl() and puffs_fcntl(); puffsop selects
 * which operation would be sent to the file server.
 *
 * The operation is currently disabled and always returns EOPNOTSUPP.
 * The intended implementation is kept below under "#if 0".
 */
int
puffs_fcnioctl(struct vop_ioctl_args *ap, int puffsop)
{

	/* currently not supported */
	return EOPNOTSUPP;
#if 0
	/* struct vop_ioctl_args {
		const struct vnodeop_desc *a_desc;
		struct vnode *a_vp;
		u_long a_command;
		void *a_data;
		int a_fflag;
		kauth_cred_t a_cred;
		struct lwp *a_l;
	}*ap = v; */
	struct puffs_mount *pmp;
	struct puffs_sizepark pspark;
	void *kernbuf;
	size_t copylen;
	int error;

	PUFFS_VNREQ(fcnioctl);

	/*
	 * Since this op gives the filesystem (almost) complete control on
	 * how much it is allowed to copy from the calling process
	 * address space, do not enable it by default, since it would
	 * be a whopping security hole.
	 */
	pmp = MPTOPUFFSMP(ap->a_vp->v_mount);
	if ((pmp->pmp_flags & PUFFS_KFLAG_ALLOWCTL) == 0)
		return EINVAL; /* only shoe that fits */

	/* fill in sizereq and store it */
	pspark.pkso_reqid = puffs_getreqid(pmp);
	pspark.pkso_reqtype = PUFFS_SIZEOPREQ_BUF_IN;
	pspark.pkso_copybuf = ap->a_data;
	pspark.pkso_bufsize = FCNIOCTL_ARG_MAX;
	TAILQ_INSERT_TAIL(&pmp->pmp_req_sizepark, &pspark, pkso_entries);

	/* then fill in actual request and shoot it off */
	fcnioctl_arg.pvnr_command = ap->a_command;
	fcnioctl_arg.pvnr_fflag = ap->a_fflag;
	puffs_credcvt(&fcnioctl_arg.pvnr_cred, ap->a_cred);
	fcnioctl_arg.pvnr_pid = puffs_lwp2pid(ap->a_l);

	error = puffs_vntouser_req(MPTOPUFFSMP(ap->a_vp->v_mount), puffsop,
	    &fcnioctl_arg, sizeof(fcnioctl_arg), 0, ap->a_vp,
	    pspark.pkso_reqid, ap->a_vp, NULL);

	/* if we don't need to copy data, we're done */
	if (error || !fcnioctl_arg.pvnr_copyback)
		return error;

	copylen = MIN(FCNIOCTL_ARG_MAX, fcnioctl_arg.pvnr_datalen);
	kernbuf = malloc(copylen, M_PUFFS, M_WAITOK);
	error = copyin(fcnioctl_arg.pvnr_data, kernbuf, copylen);
	if (error)
		goto out;
	error = copyout(kernbuf, ap->a_data, copylen);

 out:
	free(kernbuf, M_PUFFS);
	return error;
#endif
}
1768
1769 int
1770 puffs_ioctl(void *v)
1771 {
1772
1773 return puffs_fcnioctl(v, PUFFS_VN_IOCTL);
1774 }
1775
1776 int
1777 puffs_fcntl(void *v)
1778 {
1779
1780 return puffs_fcnioctl(v, PUFFS_VN_FCNTL);
1781 }
1782
1783 int
1784 puffs_print(void *v)
1785 {
1786 struct vop_print_args /* {
1787 struct vnode *a_vp;
1788 } */ *ap = v;
1789 struct puffs_mount *pmp;
1790 struct vnode *vp = ap->a_vp;
1791 struct puffs_node *pn = vp->v_data;
1792
1793 PUFFS_VNREQ(print);
1794
1795 pmp = MPTOPUFFSMP(vp->v_mount);
1796
1797 /* kernel portion */
1798 printf("tag VT_PUFFS, vnode %p, puffs node: %p,\n"
1799 " userspace cookie: %p\n", vp, pn, pn->pn_cookie);
1800 if (vp->v_type == VFIFO)
1801 fifo_printinfo(vp);
1802 lockmgr_printinfo(&vp->v_lock);
1803
1804 /* userspace portion */
1805 if (EXISTSOP(pmp, PRINT))
1806 puffs_vntouser(pmp, PUFFS_VN_PRINT,
1807 &print_arg, sizeof(print_arg), 0, ap->a_vp, NULL);
1808
1809 return 0;
1810 }
1811
1812 int
1813 puffs_pathconf(void *v)
1814 {
1815 struct vop_pathconf_args /* {
1816 const struct vnodeop_desc *a_desc;
1817 struct vnode *a_vp;
1818 int a_name;
1819 register_t *a_retval;
1820 } */ *ap = v;
1821 int error;
1822
1823 PUFFS_VNREQ(pathconf);
1824
1825 pathconf_arg.pvnr_name = ap->a_name;
1826
1827 error = puffs_vntouser(MPTOPUFFSMP(ap->a_vp->v_mount),
1828 PUFFS_VN_PATHCONF, &pathconf_arg, sizeof(pathconf_arg), 0,
1829 ap->a_vp, NULL);
1830 if (error)
1831 return error;
1832
1833 *ap->a_retval = pathconf_arg.pvnr_retval;
1834
1835 return 0;
1836 }
1837
1838 int
1839 puffs_advlock(void *v)
1840 {
1841 struct vop_advlock_args /* {
1842 const struct vnodeop_desc *a_desc;
1843 struct vnode *a_vp;
1844 void *a_id;
1845 int a_op;
1846 struct flock *a_fl;
1847 int a_flags;
1848 } */ *ap = v;
1849 int error;
1850
1851 PUFFS_VNREQ(advlock);
1852
1853 error = copyin(ap->a_fl, &advlock_arg.pvnr_fl, sizeof(struct flock));
1854 if (error)
1855 return error;
1856 advlock_arg.pvnr_id = ap->a_id;
1857 advlock_arg.pvnr_op = ap->a_op;
1858 advlock_arg.pvnr_flags = ap->a_flags;
1859
1860 return puffs_vntouser(MPTOPUFFSMP(ap->a_vp->v_mount), PUFFS_VN_ADVLOCK,
1861 &advlock_arg, sizeof(advlock_arg), 0, ap->a_vp, NULL);
1862 }
1863 /*
1864 * This maps itself to PUFFS_VN_READ/WRITE for data transfer.
1865 */
1866 int
1867 puffs_strategy(void *v)
1868 {
1869 struct vop_strategy_args /* {
1870 const struct vnodeop_desc *a_desc;
1871 struct vnode *a_vp;
1872 struct buf *a_bp;
1873 } */ *ap = v;
1874 struct puffs_mount *pmp;
1875 struct vnode *vp = ap->a_vp;
1876 struct puffs_node *pn;
1877 struct puffs_vnreq_read *read_argp = NULL;
1878 struct puffs_vnreq_write *write_argp = NULL;
1879 struct buf *bp;
1880 size_t argsize;
1881 size_t tomove, moved;
1882 int error, dowritefaf;
1883
1884 pmp = MPTOPUFFSMP(vp->v_mount);
1885 bp = ap->a_bp;
1886 error = 0;
1887 dowritefaf = 0;
1888 pn = VPTOPP(vp);
1889
1890 if (((bp->b_flags & B_READ) && !EXISTSOP(pmp, READ))
1891 || (((bp->b_flags & B_READ) == 0) && !EXISTSOP(pmp, WRITE))) {
1892 error = EOPNOTSUPP;
1893 goto out;
1894 }
1895
1896 /*
1897 * Short-circuit optimization: don't flush buffer in between
1898 * VOP_INACTIVE and VOP_RECLAIM in case the node has no references.
1899 */
1900 if (pn->pn_stat & PNODE_DYING) {
1901 KASSERT((bp->b_flags & B_READ) == 0);
1902 bp->b_resid = 0;
1903 goto out;
1904 }
1905
1906 #ifdef DIAGNOSTIC
1907 if (bp->b_bcount > pmp->pmp_req_maxsize - PUFFS_REQSTRUCT_MAX)
1908 panic("puffs_strategy: wildly inappropriate buf bcount %d",
1909 bp->b_bcount);
1910 #endif
1911
1912 /*
1913 * See explanation for the necessity of a FAF in puffs_fsync.
1914 *
1915 * Also, do FAF in case we're suspending.
1916 * See puffs_vfsops.c:pageflush()
1917 *
1918 * XXgoddamnX: B_WRITE is a "pseudo flag"
1919 */
1920 if ((bp->b_flags & B_READ) == 0) {
1921 simple_lock(&vp->v_interlock);
1922 if (vp->v_flag & VXLOCK)
1923 dowritefaf = 1;
1924 if (pn->pn_stat & PNODE_SUSPEND)
1925 dowritefaf = 1;
1926 simple_unlock(&vp->v_interlock);
1927 }
1928
1929 if (bp->b_flags & B_ASYNC)
1930 dowritefaf = 1;
1931
1932 #ifdef DIAGNOSTIC
1933 if (curproc == uvm.pagedaemon_proc)
1934 KASSERT(dowritefaf);
1935 #endif
1936
1937 tomove = PUFFS_TOMOVE(bp->b_bcount, pmp);
1938
1939 if ((bp->b_flags & (B_READ | B_ASYNC)) == (B_READ | B_ASYNC)) {
1940 argsize = sizeof(struct puffs_vnreq_read);
1941 read_argp = malloc(argsize + tomove,
1942 M_PUFFS, M_NOWAIT | M_ZERO);
1943 if (read_argp == NULL) {
1944 error = ENOMEM;
1945 goto out;
1946 }
1947
1948 read_argp->pvnr_ioflag = 0;
1949 read_argp->pvnr_resid = tomove;
1950 read_argp->pvnr_offset = bp->b_blkno << DEV_BSHIFT;
1951 puffs_credcvt(&read_argp->pvnr_cred, FSCRED);
1952
1953 puffs_vntouser_call(pmp, PUFFS_VN_READ, read_argp,
1954 argsize, tomove, puffs_parkdone_asyncbioread, bp, vp, NULL);
1955 error = 0;
1956 goto wayout;
1957 } else if (bp->b_flags & B_READ) {
1958 argsize = sizeof(struct puffs_vnreq_read);
1959 read_argp = malloc(argsize + tomove,
1960 M_PUFFS, M_WAITOK | M_ZERO);
1961
1962 read_argp->pvnr_ioflag = 0;
1963 read_argp->pvnr_resid = tomove;
1964 read_argp->pvnr_offset = bp->b_blkno << DEV_BSHIFT;
1965 puffs_credcvt(&read_argp->pvnr_cred, FSCRED);
1966
1967 error = puffs_vntouser(pmp, PUFFS_VN_READ,
1968 read_argp, argsize, tomove, vp, NULL);
1969
1970 if (error)
1971 goto out;
1972
1973 if (read_argp->pvnr_resid > tomove) {
1974 error = EINVAL;
1975 goto out;
1976 }
1977
1978 moved = tomove - read_argp->pvnr_resid;
1979
1980 (void)memcpy(bp->b_data, read_argp->pvnr_data, moved);
1981 bp->b_resid = bp->b_bcount - moved;
1982 } else {
1983 /*
1984 * make pages read-only before we write them if we want
1985 * write caching info
1986 */
1987 if (PUFFS_WCACHEINFO(pmp)) {
1988 struct uvm_object *uobj = &vp->v_uobj;
1989 int npages = (bp->b_bcount + PAGE_SIZE-1) >> PAGE_SHIFT;
1990 struct vm_page *vmp;
1991 int i;
1992
1993 for (i = 0; i < npages; i++) {
1994 vmp= uvm_pageratop((vaddr_t)bp->b_data
1995 + (i << PAGE_SHIFT));
1996 DPRINTF(("puffs_strategy: write-protecting "
1997 "vp %p page %p, offset %" PRId64"\n",
1998 vp, vmp, vmp->offset));
1999 simple_lock(&uobj->vmobjlock);
2000 vmp->flags |= PG_RDONLY;
2001 pmap_page_protect(vmp, VM_PROT_READ);
2002 simple_unlock(&uobj->vmobjlock);
2003 }
2004 }
2005
2006 argsize = sizeof(struct puffs_vnreq_write) + bp->b_bcount;
2007 write_argp = malloc(argsize, M_PUFFS, M_NOWAIT | M_ZERO);
2008 if (write_argp == NULL) {
2009 error = ENOMEM;
2010 goto out;
2011 }
2012
2013 write_argp->pvnr_ioflag = 0;
2014 write_argp->pvnr_resid = tomove;
2015 write_argp->pvnr_offset = bp->b_blkno << DEV_BSHIFT;
2016 puffs_credcvt(&write_argp->pvnr_cred, FSCRED);
2017
2018 (void)memcpy(&write_argp->pvnr_data, bp->b_data, tomove);
2019
2020 if (dowritefaf) {
2021 /*
2022 * assume FAF moves everything. frankly, we don't
2023 * really have a choice.
2024 */
2025 puffs_vntouser_faf(MPTOPUFFSMP(vp->v_mount),
2026 PUFFS_VN_WRITE, write_argp, argsize, vp);
2027 bp->b_resid = bp->b_bcount - tomove;
2028 } else {
2029 error = puffs_vntouser(MPTOPUFFSMP(vp->v_mount),
2030 PUFFS_VN_WRITE, write_argp, argsize, 0, vp, NULL);
2031 if (error)
2032 goto out;
2033
2034 moved = tomove - write_argp->pvnr_resid;
2035 if (write_argp->pvnr_resid > tomove) {
2036 error = EINVAL;
2037 goto out;
2038 }
2039
2040 bp->b_resid = bp->b_bcount - moved;
2041 if (write_argp->pvnr_resid != 0)
2042 error = EIO;
2043 }
2044 }
2045
2046 out:
2047 if (read_argp)
2048 free(read_argp, M_PUFFS);
2049 if (write_argp && !dowritefaf)
2050 free(write_argp, M_PUFFS);
2051
2052 if (error) {
2053 bp->b_error = error;
2054 bp->b_flags |= B_ERROR;
2055 }
2056
2057 if (error || ((bp->b_flags & (B_READ | B_ASYNC)) != (B_READ | B_ASYNC)))
2058 biodone(bp);
2059 wayout:
2060 return error;
2061 }
2062
2063 int
2064 puffs_mmap(void *v)
2065 {
2066 struct vop_mmap_args /* {
2067 const struct vnodeop_desc *a_desc;
2068 struct vnode *a_vp;
2069 int a_fflags;
2070 kauth_cred_t a_cred;
2071 struct lwp *a_l;
2072 } */ *ap = v;
2073 struct puffs_mount *pmp;
2074 int error;
2075
2076 PUFFS_VNREQ(mmap);
2077
2078 pmp = MPTOPUFFSMP(ap->a_vp->v_mount);
2079
2080 if (!PUFFS_DOCACHE(pmp))
2081 return genfs_eopnotsupp(v);
2082
2083 if (EXISTSOP(pmp, MMAP)) {
2084 mmap_arg.pvnr_fflags = ap->a_fflags;
2085 puffs_credcvt(&mmap_arg.pvnr_cred, ap->a_cred);
2086 mmap_arg.pvnr_pid = puffs_lwp2pid(ap->a_l);
2087
2088 error = puffs_vntouser(pmp, PUFFS_VN_MMAP,
2089 &mmap_arg, sizeof(mmap_arg), 0,
2090 ap->a_vp, NULL);
2091 } else {
2092 error = genfs_mmap(v);
2093 }
2094
2095 return error;
2096 }
2097
2098
2099 /*
2100 * The rest don't get a free trip to userspace and back, they
2101 * have to stay within the kernel.
2102 */
2103
2104 /*
2105 * bmap doesn't really make any sense for puffs, so just 1:1 map it.
2106 * well, maybe somehow, somewhere, some day ....
2107 */
2108 int
2109 puffs_bmap(void *v)
2110 {
2111 struct vop_bmap_args /* {
2112 const struct vnodeop_desc *a_desc;
2113 struct vnode *a_vp;
2114 daddr_t a_bn;
2115 struct vnode **a_vpp;
2116 daddr_t *a_bnp;
2117 int *a_runp;
2118 } */ *ap = v;
2119 struct puffs_mount *pmp;
2120
2121 pmp = MPTOPUFFSMP(ap->a_vp->v_mount);
2122
2123 if (ap->a_vpp)
2124 *ap->a_vpp = ap->a_vp;
2125 if (ap->a_bnp)
2126 *ap->a_bnp = ap->a_bn;
2127 if (ap->a_runp)
2128 *ap->a_runp
2129 = (PUFFS_TOMOVE(pmp->pmp_req_maxsize, pmp)>>DEV_BSHIFT) - 1;
2130
2131 return 0;
2132 }
2133
2134 /*
2135 * Handle getpages faults in puffs. We let genfs_getpages() do most
2136 * of the dirty work, but we come in this route to do accounting tasks.
2137 * If the user server has specified functions for cache notifications
2138 * about reads and/or writes, we record which type of operation we got,
2139 * for which page range, and proceed to issue a FAF notification to the
2140 * server about it.
2141 */
2142 int
2143 puffs_getpages(void *v)
2144 {
2145 struct vop_getpages_args /* {
2146 const struct vnodeop_desc *a_desc;
2147 struct vnode *a_vp;
2148 voff_t a_offset;
2149 struct vm_page **a_m;
2150 int *a_count;
2151 int a_centeridx;
2152 vm_prot_t a_access_type;
2153 int a_advice;
2154 int a_flags;
2155 } */ *ap = v;
2156 struct puffs_mount *pmp;
2157 struct vnode *vp;
2158 struct vm_page **pgs;
2159 struct puffs_cacheinfo *pcinfo = NULL;
2160 struct puffs_cacherun *pcrun;
2161 void *parkmem = NULL;
2162 size_t runsizes;
2163 int i, npages, si, streakon;
2164 int error, locked, write;
2165
2166 pmp = MPTOPUFFSMP(ap->a_vp->v_mount);
2167 npages = *ap->a_count;
2168 pgs = ap->a_m;
2169 vp = ap->a_vp;
2170 locked = (ap->a_flags & PGO_LOCKED) != 0;
2171 write = (ap->a_access_type & VM_PROT_WRITE) != 0;
2172
2173 /* ccg xnaht - gets Wuninitialized wrong */
2174 pcrun = NULL;
2175 runsizes = 0;
2176
2177 if (write && PUFFS_WCACHEINFO(pmp)) {
2178 /* allocate worst-case memory */
2179 runsizes = ((npages / 2) + 1) * sizeof(struct puffs_cacherun);
2180 pcinfo = malloc(sizeof(struct puffs_cacheinfo) + runsizes,
2181 M_PUFFS, M_ZERO | locked ? M_NOWAIT : M_WAITOK);
2182
2183 /*
2184 * can't block if we're locked and can't mess up caching
2185 * information for fs server. so come back later, please
2186 */
2187 if (pcinfo == NULL) {
2188 error = ENOMEM;
2189 goto out;
2190 }
2191
2192 parkmem = puffs_park_alloc(locked == 0);
2193 if (parkmem == NULL) {
2194 error = ENOMEM;
2195 goto out;
2196 }
2197
2198 pcrun = pcinfo->pcache_runs;
2199 }
2200
2201 error = genfs_getpages(v);
2202 if (error)
2203 goto out;
2204
2205 if (PUFFS_WCACHEINFO(pmp) == 0)
2206 goto out;
2207
2208 /*
2209 * Let's see whose fault it was and inform the user server of
2210 * possibly read/written pages. Map pages from read faults
2211 * strictly read-only, since otherwise we might miss info on
2212 * when the page is actually write-faulted to.
2213 */
2214 if (!locked)
2215 simple_lock(&vp->v_uobj.vmobjlock);
2216 for (i = 0, si = 0, streakon = 0; i < npages; i++) {
2217 if (pgs[i] == NULL || pgs[i] == PGO_DONTCARE) {
2218 if (streakon && write) {
2219 streakon = 0;
2220 pcrun[si].pcache_runend
2221 = trunc_page(pgs[i]->offset) + PAGE_MASK;
2222 si++;
2223 }
2224 continue;
2225 }
2226 if (streakon == 0 && write) {
2227 streakon = 1;
2228 pcrun[si].pcache_runstart = pgs[i]->offset;
2229 }
2230
2231 if (!write)
2232 pgs[i]->flags |= PG_RDONLY;
2233 }
2234 /* was the last page part of our streak? */
2235 if (streakon) {
2236 pcrun[si].pcache_runend
2237 = trunc_page(pgs[i-1]->offset) + PAGE_MASK;
2238 si++;
2239 }
2240 if (!locked)
2241 simple_unlock(&vp->v_uobj.vmobjlock);
2242
2243 KASSERT(si <= (npages / 2) + 1);
2244
2245 /* send results to userspace */
2246 if (write)
2247 puffs_cacheop(pmp, parkmem, pcinfo,
2248 sizeof(struct puffs_cacheinfo) + runsizes, VPTOPNC(vp));
2249
2250 out:
2251 if (error) {
2252 if (pcinfo != NULL)
2253 free(pcinfo, M_PUFFS);
2254 if (parkmem != NULL)
2255 puffs_park_release(parkmem, 1);
2256 }
2257
2258 return error;
2259 }
2260
2261 int
2262 puffs_lock(void *v)
2263 {
2264 struct vop_lock_args /* {
2265 struct vnode *a_vp;
2266 int a_flags;
2267 }*/ *ap = v;
2268 struct vnode *vp = ap->a_vp;
2269 struct mount *mp = vp->v_mount;
2270
2271 #if 0
2272 DPRINTF(("puffs_lock: lock %p, args 0x%x\n", vp, ap->a_flags));
2273 #endif
2274
2275 /*
2276 * XXX: this avoids deadlocking when we're suspending.
2277 * e.g. some ops holding the vnode lock might be blocked for
2278 * the vfs transaction lock so we'd deadlock.
2279 *
2280 * Now once again this is skating on the thin ice of modern life,
2281 * since we are breaking the consistency guarantee provided
2282 * _to the user server_ by vnode locking. Hopefully this will
2283 * get fixed soon enough by getting rid of the dependency on
2284 * vnode locks alltogether.
2285 */
2286 if (fstrans_is_owner(mp) && fstrans_getstate(mp) == FSTRANS_SUSPENDING){
2287 if (ap->a_flags & LK_INTERLOCK)
2288 simple_unlock(&vp->v_interlock);
2289 return 0;
2290 }
2291
2292 return lockmgr(&vp->v_lock, ap->a_flags, &vp->v_interlock);
2293 }
2294
2295 int
2296 puffs_unlock(void *v)
2297 {
2298 struct vop_unlock_args /* {
2299 struct vnode *a_vp;
2300 int a_flags;
2301 } */ *ap = v;
2302 struct vnode *vp = ap->a_vp;
2303 struct mount *mp = vp->v_mount;
2304
2305 #if 0
2306 DPRINTF(("puffs_unlock: lock %p, args 0x%x\n", vp, ap->a_flags));
2307 #endif
2308
2309 /* XXX: see puffs_lock() */
2310 if (fstrans_is_owner(mp) && fstrans_getstate(mp) == FSTRANS_SUSPENDING){
2311 if (ap->a_flags & LK_INTERLOCK)
2312 simple_unlock(&vp->v_interlock);
2313 return 0;
2314 }
2315
2316 return lockmgr(&vp->v_lock, ap->a_flags | LK_RELEASE, &vp->v_interlock);
2317 }
2318
2319 int
2320 puffs_islocked(void *v)
2321 {
2322 struct vop_islocked_args *ap = v;
2323 int rv;
2324
2325 rv = lockstatus(&ap->a_vp->v_lock);
2326 return rv;
2327 }
2328
2329 int
2330 puffs_generic(void *v)
2331 {
2332 struct vop_generic_args *ap = v;
2333
2334 (void)ap;
2335 DPRINTF(("puffs_generic: ap->a_desc = %s\n", ap->a_desc->vdesc_name));
2336
2337 return EOPNOTSUPP;
2338 }
2339
2340
2341 /*
2342 * spec & fifo. These call the miscfs spec and fifo vectors, but issue
2343 * FAF update information for the puffs node first.
2344 */
2345 int
2346 puffs_spec_read(void *v)
2347 {
2348 struct vop_read_args /* {
2349 const struct vnodeop_desc *a_desc;
2350 struct vnode *a_vp;
2351 struct uio *a_uio;
2352 int a_ioflag;
2353 kauth_cred_t a_cred;
2354 } */ *ap = v;
2355
2356 puffs_updatenode(ap->a_vp, PUFFS_UPDATEATIME);
2357 return VOCALL(spec_vnodeop_p, VOFFSET(vop_read), v);
2358 }
2359
2360 int
2361 puffs_spec_write(void *v)
2362 {
2363 struct vop_write_args /* {
2364 const struct vnodeop_desc *a_desc;
2365 struct vnode *a_vp;
2366 struct uio *a_uio;
2367 int a_ioflag;
2368 kauth_cred_t a_cred;
2369 }*/ *ap = v;
2370
2371 puffs_updatenode(ap->a_vp, PUFFS_UPDATEMTIME);
2372 return VOCALL(spec_vnodeop_p, VOFFSET(vop_write), v);
2373 }
2374
2375 int
2376 puffs_fifo_read(void *v)
2377 {
2378 struct vop_read_args /* {
2379 const struct vnodeop_desc *a_desc;
2380 struct vnode *a_vp;
2381 struct uio *a_uio;
2382 int a_ioflag;
2383 kauth_cred_t a_cred;
2384 } */ *ap = v;
2385
2386 puffs_updatenode(ap->a_vp, PUFFS_UPDATEATIME);
2387 return VOCALL(fifo_vnodeop_p, VOFFSET(vop_read), v);
2388 }
2389
2390 int
2391 puffs_fifo_write(void *v)
2392 {
2393 struct vop_write_args /* {
2394 const struct vnodeop_desc *a_desc;
2395 struct vnode *a_vp;
2396 struct uio *a_uio;
2397 int a_ioflag;
2398 kauth_cred_t a_cred;
2399 }*/ *ap = v;
2400
2401 puffs_updatenode(ap->a_vp, PUFFS_UPDATEMTIME);
2402 return VOCALL(fifo_vnodeop_p, VOFFSET(vop_write), v);
2403 }
2404