puffs_vnops.c revision 1.85 1 /* $NetBSD: puffs_vnops.c,v 1.85 2007/07/02 10:24:17 pooka Exp $ */
2
3 /*
4 * Copyright (c) 2005, 2006, 2007 Antti Kantee. All Rights Reserved.
5 *
6 * Development of this software was supported by the
7 * Google Summer of Code program and the Ulla Tuominen Foundation.
8 * The Google SoC project was mentored by Bill Studenmund.
9 *
10 * Redistribution and use in source and binary forms, with or without
11 * modification, are permitted provided that the following conditions
12 * are met:
13 * 1. Redistributions of source code must retain the above copyright
14 * notice, this list of conditions and the following disclaimer.
15 * 2. Redistributions in binary form must reproduce the above copyright
16 * notice, this list of conditions and the following disclaimer in the
17 * documentation and/or other materials provided with the distribution.
18 *
19 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS
20 * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
21 * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
22 * DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
23 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
24 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
25 * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
26 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
27 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
28 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29 * SUCH DAMAGE.
30 */
31
32 #include <sys/cdefs.h>
33 __KERNEL_RCSID(0, "$NetBSD: puffs_vnops.c,v 1.85 2007/07/02 10:24:17 pooka Exp $");
34
35 #include <sys/param.h>
36 #include <sys/fstrans.h>
37 #include <sys/malloc.h>
38 #include <sys/mount.h>
39 #include <sys/namei.h>
40 #include <sys/vnode.h>
41 #include <uvm/uvm.h>
42
43 #include <fs/puffs/puffs_msgif.h>
44 #include <fs/puffs/puffs_sys.h>
45
46 #include <miscfs/fifofs/fifo.h>
47 #include <miscfs/genfs/genfs.h>
48 #include <miscfs/specfs/specdev.h>
49
/*
 * Forward declarations for the vnode operation handlers referenced by
 * the operation vectors below.  Every handler receives the generic,
 * per-operation argument structure through a single void pointer.
 */

/* namespace operations */
int	puffs_lookup(void *v);
int	puffs_create(void *v);
int	puffs_mknod(void *v);
int	puffs_remove(void *v);
int	puffs_mkdir(void *v);
int	puffs_rmdir(void *v);
int	puffs_link(void *v);
int	puffs_symlink(void *v);
int	puffs_readlink(void *v);
int	puffs_rename(void *v);
int	puffs_readdir(void *v);

/* open file and attribute operations */
int	puffs_open(void *v);
int	puffs_close(void *v);
int	puffs_access(void *v);
int	puffs_getattr(void *v);
int	puffs_setattr(void *v);
int	puffs_poll(void *v);
int	puffs_fsync(void *v);
int	puffs_seek(void *v);
int	puffs_fcntl(void *v);
int	puffs_ioctl(void *v);
int	puffs_pathconf(void *v);
int	puffs_advlock(void *v);

/* data transfer */
int	puffs_read(void *v);
int	puffs_write(void *v);
int	puffs_strategy(void *v);
int	puffs_bmap(void *v);
int	puffs_mmap(void *v);
int	puffs_getpages(void *v);

/* vnode life cycle and debugging */
int	puffs_inactive(void *v);
int	puffs_reclaim(void *v);
int	puffs_print(void *v);

/* read/write wrappers for special devices and fifos */
int	puffs_spec_read(void *v);
int	puffs_spec_write(void *v);
int	puffs_fifo_read(void *v);
int	puffs_fifo_write(void *v);

/* dispatcher which consults the file server's operation mask */
int	puffs_checkop(void *v);

/* VOP_LEASE() not included */

int	puffs_generic(void *v);

/* vnode locking: own implementations, the genfs aliases are disabled */
#if 0
#define puffs_lock genfs_lock
#define puffs_unlock genfs_unlock
#define puffs_islocked genfs_islocked
#else
int	puffs_lock(void *v);
int	puffs_unlock(void *v);
int	puffs_islocked(void *v);
#endif
104
105 int (**puffs_vnodeop_p)(void *);
106 const struct vnodeopv_entry_desc puffs_vnodeop_entries[] = {
107 { &vop_default_desc, vn_default_error },
108 { &vop_lookup_desc, puffs_lookup }, /* REAL lookup */
109 { &vop_create_desc, puffs_checkop }, /* create */
110 { &vop_mknod_desc, puffs_checkop }, /* mknod */
111 { &vop_open_desc, puffs_open }, /* REAL open */
112 { &vop_close_desc, puffs_checkop }, /* close */
113 { &vop_access_desc, puffs_access }, /* REAL access */
114 { &vop_getattr_desc, puffs_checkop }, /* getattr */
115 { &vop_setattr_desc, puffs_checkop }, /* setattr */
116 { &vop_read_desc, puffs_checkop }, /* read */
117 { &vop_write_desc, puffs_checkop }, /* write */
118 { &vop_fcntl_desc, puffs_checkop }, /* fcntl */
119 { &vop_ioctl_desc, puffs_checkop }, /* ioctl */
120 { &vop_fsync_desc, puffs_fsync }, /* REAL fsync */
121 { &vop_seek_desc, puffs_checkop }, /* seek */
122 { &vop_remove_desc, puffs_checkop }, /* remove */
123 { &vop_link_desc, puffs_checkop }, /* link */
124 { &vop_rename_desc, puffs_checkop }, /* rename */
125 { &vop_mkdir_desc, puffs_checkop }, /* mkdir */
126 { &vop_rmdir_desc, puffs_checkop }, /* rmdir */
127 { &vop_symlink_desc, puffs_checkop }, /* symlink */
128 { &vop_readdir_desc, puffs_checkop }, /* readdir */
129 { &vop_readlink_desc, puffs_checkop }, /* readlink */
130 { &vop_getpages_desc, puffs_checkop }, /* getpages */
131 { &vop_putpages_desc, genfs_putpages }, /* REAL putpages */
132 { &vop_pathconf_desc, puffs_checkop }, /* pathconf */
133 { &vop_advlock_desc, puffs_checkop }, /* advlock */
134 { &vop_strategy_desc, puffs_strategy }, /* REAL strategy */
135 { &vop_revoke_desc, genfs_revoke }, /* REAL revoke */
136 { &vop_abortop_desc, genfs_abortop }, /* REAL abortop */
137 { &vop_inactive_desc, puffs_inactive }, /* REAL inactive */
138 { &vop_reclaim_desc, puffs_reclaim }, /* REAL reclaim */
139 { &vop_lock_desc, puffs_lock }, /* REAL lock */
140 { &vop_unlock_desc, puffs_unlock }, /* REAL unlock */
141 { &vop_bmap_desc, puffs_bmap }, /* REAL bmap */
142 { &vop_print_desc, puffs_print }, /* REAL print */
143 { &vop_islocked_desc, puffs_islocked }, /* REAL islocked */
144 { &vop_bwrite_desc, genfs_nullop }, /* REAL bwrite */
145 { &vop_mmap_desc, puffs_mmap }, /* REAL mmap */
146 { &vop_poll_desc, puffs_poll }, /* REAL poll */
147
148 { &vop_kqfilter_desc, genfs_eopnotsupp }, /* kqfilter XXX */
149 { NULL, NULL }
150 };
151 const struct vnodeopv_desc puffs_vnodeop_opv_desc =
152 { &puffs_vnodeop_p, puffs_vnodeop_entries };
153
154
155 int (**puffs_specop_p)(void *);
156 const struct vnodeopv_entry_desc puffs_specop_entries[] = {
157 { &vop_default_desc, vn_default_error },
158 { &vop_lookup_desc, spec_lookup }, /* lookup, ENOTDIR */
159 { &vop_create_desc, spec_create }, /* genfs_badop */
160 { &vop_mknod_desc, spec_mknod }, /* genfs_badop */
161 { &vop_open_desc, spec_open }, /* spec_open */
162 { &vop_close_desc, spec_close }, /* spec_close */
163 { &vop_access_desc, puffs_checkop }, /* access */
164 { &vop_getattr_desc, puffs_checkop }, /* getattr */
165 { &vop_setattr_desc, puffs_checkop }, /* setattr */
166 { &vop_read_desc, puffs_spec_read }, /* update, read */
167 { &vop_write_desc, puffs_spec_write }, /* update, write */
168 { &vop_lease_desc, spec_lease_check }, /* genfs_nullop */
169 { &vop_ioctl_desc, spec_ioctl }, /* spec_ioctl */
170 { &vop_fcntl_desc, genfs_fcntl }, /* dummy */
171 { &vop_poll_desc, spec_poll }, /* spec_poll */
172 { &vop_kqfilter_desc, spec_kqfilter }, /* spec_kqfilter */
173 { &vop_revoke_desc, spec_revoke }, /* genfs_revoke */
174 { &vop_mmap_desc, spec_mmap }, /* spec_mmap */
175 { &vop_fsync_desc, spec_fsync }, /* vflushbuf */
176 { &vop_seek_desc, spec_seek }, /* genfs_nullop */
177 { &vop_remove_desc, spec_remove }, /* genfs_badop */
178 { &vop_link_desc, spec_link }, /* genfs_badop */
179 { &vop_rename_desc, spec_rename }, /* genfs_badop */
180 { &vop_mkdir_desc, spec_mkdir }, /* genfs_badop */
181 { &vop_rmdir_desc, spec_rmdir }, /* genfs_badop */
182 { &vop_symlink_desc, spec_symlink }, /* genfs_badop */
183 { &vop_readdir_desc, spec_readdir }, /* genfs_badop */
184 { &vop_readlink_desc, spec_readlink }, /* genfs_badop */
185 { &vop_abortop_desc, spec_abortop }, /* genfs_badop */
186 { &vop_inactive_desc, puffs_inactive }, /* REAL inactive */
187 { &vop_reclaim_desc, puffs_reclaim }, /* REAL reclaim */
188 { &vop_lock_desc, puffs_lock }, /* REAL lock */
189 { &vop_unlock_desc, puffs_unlock }, /* REAL unlock */
190 { &vop_bmap_desc, spec_bmap }, /* dummy */
191 { &vop_strategy_desc, spec_strategy }, /* dev strategy */
192 { &vop_print_desc, puffs_print }, /* REAL print */
193 { &vop_islocked_desc, puffs_islocked }, /* REAL islocked */
194 { &vop_pathconf_desc, spec_pathconf }, /* pathconf */
195 { &vop_advlock_desc, spec_advlock }, /* lf_advlock */
196 { &vop_bwrite_desc, vn_bwrite }, /* bwrite */
197 { &vop_getpages_desc, spec_getpages }, /* genfs_getpages */
198 { &vop_putpages_desc, spec_putpages }, /* genfs_putpages */
199 #if 0
200 { &vop_openextattr_desc, _openextattr }, /* openextattr */
201 { &vop_closeextattr_desc, _closeextattr }, /* closeextattr */
202 { &vop_getextattr_desc, _getextattr }, /* getextattr */
203 { &vop_setextattr_desc, _setextattr }, /* setextattr */
204 { &vop_listextattr_desc, _listextattr }, /* listextattr */
205 { &vop_deleteextattr_desc, _deleteextattr }, /* deleteextattr */
206 #endif
207 { NULL, NULL }
208 };
209 const struct vnodeopv_desc puffs_specop_opv_desc =
210 { &puffs_specop_p, puffs_specop_entries };
211
212
213 int (**puffs_fifoop_p)(void *);
214 const struct vnodeopv_entry_desc puffs_fifoop_entries[] = {
215 { &vop_default_desc, vn_default_error },
216 { &vop_lookup_desc, fifo_lookup }, /* lookup, ENOTDIR */
217 { &vop_create_desc, fifo_create }, /* genfs_badop */
218 { &vop_mknod_desc, fifo_mknod }, /* genfs_badop */
219 { &vop_open_desc, fifo_open }, /* open */
220 { &vop_close_desc, fifo_close }, /* close */
221 { &vop_access_desc, puffs_checkop }, /* access */
222 { &vop_getattr_desc, puffs_checkop }, /* getattr */
223 { &vop_setattr_desc, puffs_checkop }, /* setattr */
224 { &vop_read_desc, puffs_fifo_read }, /* read, update */
225 { &vop_write_desc, puffs_fifo_write }, /* write, update */
226 { &vop_lease_desc, fifo_lease_check }, /* genfs_nullop */
227 { &vop_ioctl_desc, fifo_ioctl }, /* ioctl */
228 { &vop_fcntl_desc, genfs_fcntl }, /* dummy */
229 { &vop_poll_desc, fifo_poll }, /* poll */
230 { &vop_kqfilter_desc, fifo_kqfilter }, /* kqfilter */
231 { &vop_revoke_desc, fifo_revoke }, /* genfs_revoke */
232 { &vop_mmap_desc, fifo_mmap }, /* genfs_badop */
233 { &vop_fsync_desc, fifo_fsync }, /* genfs_nullop*/
234 { &vop_seek_desc, fifo_seek }, /* genfs_badop */
235 { &vop_remove_desc, fifo_remove }, /* genfs_badop */
236 { &vop_link_desc, fifo_link }, /* genfs_badop */
237 { &vop_rename_desc, fifo_rename }, /* genfs_badop */
238 { &vop_mkdir_desc, fifo_mkdir }, /* genfs_badop */
239 { &vop_rmdir_desc, fifo_rmdir }, /* genfs_badop */
240 { &vop_symlink_desc, fifo_symlink }, /* genfs_badop */
241 { &vop_readdir_desc, fifo_readdir }, /* genfs_badop */
242 { &vop_readlink_desc, fifo_readlink }, /* genfs_badop */
243 { &vop_abortop_desc, fifo_abortop }, /* genfs_badop */
244 { &vop_inactive_desc, puffs_inactive }, /* REAL inactive */
245 { &vop_reclaim_desc, puffs_reclaim }, /* REAL reclaim */
246 { &vop_lock_desc, puffs_lock }, /* REAL lock */
247 { &vop_unlock_desc, puffs_unlock }, /* REAL unlock */
248 { &vop_bmap_desc, fifo_bmap }, /* dummy */
249 { &vop_strategy_desc, fifo_strategy }, /* genfs_badop */
250 { &vop_print_desc, puffs_print }, /* REAL print */
251 { &vop_islocked_desc, puffs_islocked }, /* REAL islocked */
252 { &vop_pathconf_desc, fifo_pathconf }, /* pathconf */
253 { &vop_advlock_desc, fifo_advlock }, /* genfs_einval */
254 { &vop_bwrite_desc, vn_bwrite }, /* bwrite */
255 { &vop_putpages_desc, fifo_putpages }, /* genfs_null_putpages*/
256 #if 0
257 { &vop_openextattr_desc, _openextattr }, /* openextattr */
258 { &vop_closeextattr_desc, _closeextattr }, /* closeextattr */
259 { &vop_getextattr_desc, _getextattr }, /* getextattr */
260 { &vop_setextattr_desc, _setextattr }, /* setextattr */
261 { &vop_listextattr_desc, _listextattr }, /* listextattr */
262 { &vop_deleteextattr_desc, _deleteextattr }, /* deleteextattr */
263 #endif
264 { NULL, NULL }
265 };
266 const struct vnodeopv_desc puffs_fifoop_opv_desc =
267 { &puffs_fifoop_p, puffs_fifoop_entries };
268
269
270 /* "real" vnode operations */
271 int (**puffs_msgop_p)(void *);
272 const struct vnodeopv_entry_desc puffs_msgop_entries[] = {
273 { &vop_default_desc, vn_default_error },
274 { &vop_create_desc, puffs_create }, /* create */
275 { &vop_mknod_desc, puffs_mknod }, /* mknod */
276 { &vop_open_desc, puffs_open }, /* open */
277 { &vop_close_desc, puffs_close }, /* close */
278 { &vop_access_desc, puffs_access }, /* access */
279 { &vop_getattr_desc, puffs_getattr }, /* getattr */
280 { &vop_setattr_desc, puffs_setattr }, /* setattr */
281 { &vop_read_desc, puffs_read }, /* read */
282 { &vop_write_desc, puffs_write }, /* write */
283 { &vop_fcntl_desc, puffs_fcntl }, /* fcntl */
284 { &vop_ioctl_desc, puffs_ioctl }, /* ioctl */
285 { &vop_seek_desc, puffs_seek }, /* seek */
286 { &vop_remove_desc, puffs_remove }, /* remove */
287 { &vop_link_desc, puffs_link }, /* link */
288 { &vop_rename_desc, puffs_rename }, /* rename */
289 { &vop_mkdir_desc, puffs_mkdir }, /* mkdir */
290 { &vop_rmdir_desc, puffs_rmdir }, /* rmdir */
291 { &vop_symlink_desc, puffs_symlink }, /* symlink */
292 { &vop_readdir_desc, puffs_readdir }, /* readdir */
293 { &vop_readlink_desc, puffs_readlink }, /* readlink */
294 { &vop_print_desc, puffs_print }, /* print */
295 { &vop_islocked_desc, puffs_islocked }, /* islocked */
296 { &vop_pathconf_desc, puffs_pathconf }, /* pathconf */
297 { &vop_advlock_desc, puffs_advlock }, /* advlock */
298 { &vop_getpages_desc, puffs_getpages }, /* getpages */
299 { NULL, NULL }
300 };
301 const struct vnodeopv_desc puffs_msgop_opv_desc =
302 { &puffs_msgop_p, puffs_msgop_entries };
303
304
/*
 * Bail out of the calling function with the given error: store the
 * value in the local variable "error" and jump to the local label
 * "out".  Both must exist in the function using the macro.
 */
#define ERROUT(err)							\
do {									\
	error = (err);							\
	goto out;							\
} while (/*CONSTCOND*/0)
310
/*
 * This is a generic vnode operation handler. It checks if the necessary
 * operations for the called vnode operation are implemented by userspace
 * and either returns a dummy return value or proceeds to call the real
 * vnode operation from puffs_msgop_p.
 *
 * XXX: this should be described elsewhere and autogenerated, the complexity
 * of the vnode operations vectors and their interrelationships is also
 * getting a bit out of hand. Another problem is that we need this same
 * information in the fs server code, so keeping the two in sync manually
 * is not a viable (long term) plan.
 */
323
/*
 * Case-label helpers for the switch statement in puffs_checkop().
 * Both expand to a complete "case" which looks at the mount's
 * operation mask through the local "pmp" and, when the mask entry for
 * the operation is zero, return from the enclosing function.
 *
 * NOTE(review): "op" is pasted directly with ## on purpose.  Names such
 * as CREATE and RENAME are also used as plain constants in this file
 * (presumably macros), so passing "op" through another macro layer
 * could expand it before pasting -- confirm before refactoring.
 */

/* operation missing: fail through genfs_eopnotsupp(), which handles locking */
#define CHECKOP_NOTSUPP(op)						\
case VOP_##op##_DESCOFFSET:						\
	if (!pmp->pmp_vnopmask[PUFFS_VN_##op])				\
		return genfs_eopnotsupp(v);				\
	break

/* operation missing: report success right away, nothing to unlock */
#define CHECKOP_SUCCESS(op)						\
case VOP_##op##_DESCOFFSET:						\
	if (!pmp->pmp_vnopmask[PUFFS_VN_##op])				\
		return 0;						\
	break
337
338 int
339 puffs_checkop(void *v)
340 {
341 struct vop_generic_args /* {
342 struct vnodeop_desc *a_desc;
343 spooky mystery contents;
344 } */ *ap = v;
345 struct vnodeop_desc *desc = ap->a_desc;
346 struct puffs_mount *pmp;
347 struct vnode *vp;
348 int offset, rv;
349
350 offset = ap->a_desc->vdesc_vp_offsets[0];
351 #ifdef DIAGNOSTIC
352 if (offset == VDESC_NO_OFFSET)
353 panic("puffs_checkop: no vnode, why did you call me?");
354 #endif
355 vp = *VOPARG_OFFSETTO(struct vnode **, offset, ap);
356 pmp = MPTOPUFFSMP(vp->v_mount);
357
358 DPRINTF_VERBOSE(("checkop call %s (%d), vp %p\n",
359 ap->a_desc->vdesc_name, ap->a_desc->vdesc_offset, vp));
360
361 if (!ALLOPS(pmp)) {
362 switch (desc->vdesc_offset) {
363 CHECKOP_NOTSUPP(CREATE);
364 CHECKOP_NOTSUPP(MKNOD);
365 CHECKOP_NOTSUPP(GETATTR);
366 CHECKOP_NOTSUPP(SETATTR);
367 CHECKOP_NOTSUPP(READ);
368 CHECKOP_NOTSUPP(WRITE);
369 CHECKOP_NOTSUPP(FCNTL);
370 CHECKOP_NOTSUPP(IOCTL);
371 CHECKOP_NOTSUPP(REMOVE);
372 CHECKOP_NOTSUPP(LINK);
373 CHECKOP_NOTSUPP(RENAME);
374 CHECKOP_NOTSUPP(MKDIR);
375 CHECKOP_NOTSUPP(RMDIR);
376 CHECKOP_NOTSUPP(SYMLINK);
377 CHECKOP_NOTSUPP(READDIR);
378 CHECKOP_NOTSUPP(READLINK);
379 CHECKOP_NOTSUPP(PRINT);
380 CHECKOP_NOTSUPP(PATHCONF);
381 CHECKOP_NOTSUPP(ADVLOCK);
382
383 CHECKOP_SUCCESS(ACCESS);
384 CHECKOP_SUCCESS(CLOSE);
385 CHECKOP_SUCCESS(SEEK);
386
387 case VOP_GETPAGES_DESCOFFSET:
388 if (!EXISTSOP(pmp, READ))
389 return genfs_eopnotsupp(v);
390 break;
391
392 default:
393 panic("puffs_checkop: unhandled vnop %d",
394 desc->vdesc_offset);
395 }
396 }
397
398 rv = VOCALL(puffs_msgop_p, ap->a_desc->vdesc_offset, v);
399
400 DPRINTF_VERBOSE(("checkop return %s (%d), vp %p: %d\n",
401 ap->a_desc->vdesc_name, ap->a_desc->vdesc_offset, vp, rv));
402
403 return rv;
404 }
405
406
407 int
408 puffs_lookup(void *v)
409 {
410 struct vop_lookup_args /* {
411 const struct vnodeop_desc *a_desc;
412 struct vnode *a_dvp;
413 struct vnode **a_vpp;
414 struct componentname *a_cnp;
415 } */ *ap = v;
416 struct puffs_mount *pmp;
417 struct componentname *cnp;
418 struct vnode *vp, *dvp;
419 struct puffs_node *dpn;
420 int isdot;
421 int error;
422
423 PUFFS_VNREQ(lookup);
424
425 pmp = MPTOPUFFSMP(ap->a_dvp->v_mount);
426 cnp = ap->a_cnp;
427 dvp = ap->a_dvp;
428 *ap->a_vpp = NULL;
429
430 /* first things first: check access */
431 error = VOP_ACCESS(dvp, VEXEC, cnp->cn_cred, cnp->cn_lwp);
432 if (error)
433 return error;
434
435 isdot = cnp->cn_namelen == 1 && *cnp->cn_nameptr == '.';
436
437 DPRINTF(("puffs_lookup: \"%s\", parent vnode %p, op: %lx\n",
438 cnp->cn_nameptr, dvp, cnp->cn_nameiop));
439
440 /*
441 * Check if someone fed it into the cache
442 */
443 if (PUFFS_USE_NAMECACHE(pmp)) {
444 error = cache_lookup(dvp, ap->a_vpp, cnp);
445
446 if (error >= 0)
447 return error;
448 }
449
450 if (isdot) {
451 vp = ap->a_dvp;
452 vref(vp);
453 *ap->a_vpp = vp;
454 return 0;
455 }
456
457 puffs_makecn(&lookup_arg.pvnr_cn, &lookup_arg.pvnr_cn_cred,
458 &lookup_arg.pvnr_cn_cid, cnp, PUFFS_USE_FULLPNBUF(pmp));
459
460 if (cnp->cn_flags & ISDOTDOT)
461 VOP_UNLOCK(dvp, 0);
462
463 error = puffs_vntouser(pmp, PUFFS_VN_LOOKUP,
464 &lookup_arg, sizeof(lookup_arg), 0, dvp, NULL);
465 DPRINTF(("puffs_lookup: return of the userspace, part %d\n", error));
466
467 /*
468 * In case of error, there is no new vnode to play with, so be
469 * happy with the NULL value given to vpp in the beginning.
470 * Also, check if this really was an error or the target was not
471 * present. Either treat it as a non-error for CREATE/RENAME or
472 * enter the component into the negative name cache (if desired).
473 */
474 if (error) {
475 if (error == ENOENT) {
476 if ((cnp->cn_flags & ISLASTCN)
477 && (cnp->cn_nameiop == CREATE
478 || cnp->cn_nameiop == RENAME)) {
479 cnp->cn_flags |= SAVENAME;
480 error = EJUSTRETURN;
481 } else {
482 if ((cnp->cn_flags & MAKEENTRY)
483 && PUFFS_USE_NAMECACHE(pmp))
484 cache_enter(dvp, NULL, cnp);
485 }
486 } else if (error < 0) {
487 error = EINVAL;
488 }
489 goto out;
490 }
491
492 /*
493 * Check that we don't get our parent node back, that would cause
494 * a pretty obvious deadlock.
495 */
496 dpn = dvp->v_data;
497 if (lookup_arg.pvnr_newnode == dpn->pn_cookie) {
498 error = EINVAL;
499 goto out;
500 }
501
502 /* XXX: race here */
503 /* XXX2: this check for node existence twice */
504 error = puffs_pnode2vnode(pmp, lookup_arg.pvnr_newnode, 1, &vp);
505 if (error) {
506 error = puffs_getvnode(dvp->v_mount,
507 lookup_arg.pvnr_newnode, lookup_arg.pvnr_vtype,
508 lookup_arg.pvnr_size, lookup_arg.pvnr_rdev, &vp);
509 if (error) {
510 goto out;
511 }
512 vn_lock(vp, LK_EXCLUSIVE | LK_RETRY);
513 }
514 *ap->a_vpp = vp;
515
516 if ((cnp->cn_flags & MAKEENTRY) != 0 && PUFFS_USE_NAMECACHE(pmp))
517 cache_enter(dvp, vp, cnp);
518
519 out:
520 if (cnp->cn_flags & ISDOTDOT)
521 vn_lock(dvp, LK_EXCLUSIVE | LK_RETRY);
522
523 DPRINTF(("puffs_lookup: returning %d %p\n", error, *ap->a_vpp));
524 return error;
525 }
526
527 int
528 puffs_create(void *v)
529 {
530 struct vop_create_args /* {
531 const struct vnodeop_desc *a_desc;
532 struct vnode *a_dvp;
533 struct vnode **a_vpp;
534 struct componentname *a_cnp;
535 struct vattr *a_vap;
536 } */ *ap = v;
537 struct puffs_mount *pmp = MPTOPUFFSMP(ap->a_dvp->v_mount);
538 int error;
539
540 PUFFS_VNREQ(create);
541
542 DPRINTF(("puffs_create: dvp %p, cnp: %s\n",
543 ap->a_dvp, ap->a_cnp->cn_nameptr));
544
545 puffs_makecn(&create_arg.pvnr_cn, &create_arg.pvnr_cn_cred,
546 &create_arg.pvnr_cn_cid, ap->a_cnp, PUFFS_USE_FULLPNBUF(pmp));
547 create_arg.pvnr_va = *ap->a_vap;
548
549 error = puffs_vntouser(pmp, PUFFS_VN_CREATE,
550 &create_arg, sizeof(create_arg), 0, ap->a_dvp, NULL);
551 if (error)
552 goto out;
553
554 error = puffs_newnode(ap->a_dvp->v_mount, ap->a_dvp, ap->a_vpp,
555 create_arg.pvnr_newnode, ap->a_cnp, ap->a_vap->va_type, 0);
556 /* XXX: in case of error, need to uncommit userspace transaction */
557
558 out:
559 if (error || (ap->a_cnp->cn_flags & SAVESTART) == 0)
560 PNBUF_PUT(ap->a_cnp->cn_pnbuf);
561 vput(ap->a_dvp);
562
563 DPRINTF(("puffs_create: return %d\n", error));
564 return error;
565 }
566
567 int
568 puffs_mknod(void *v)
569 {
570 struct vop_mknod_args /* {
571 const struct vnodeop_desc *a_desc;
572 struct vnode *a_dvp;
573 struct vnode **a_vpp;
574 struct componentname *a_cnp;
575 struct vattr *a_vap;
576 } */ *ap = v;
577 struct puffs_mount *pmp = MPTOPUFFSMP(ap->a_dvp->v_mount);
578 int error;
579
580 PUFFS_VNREQ(mknod);
581
582 puffs_makecn(&mknod_arg.pvnr_cn, &mknod_arg.pvnr_cn_cred,
583 &mknod_arg.pvnr_cn_cid, ap->a_cnp, PUFFS_USE_FULLPNBUF(pmp));
584 mknod_arg.pvnr_va = *ap->a_vap;
585
586 error = puffs_vntouser(pmp, PUFFS_VN_MKNOD,
587 &mknod_arg, sizeof(mknod_arg), 0, ap->a_dvp, NULL);
588 if (error)
589 goto out;
590
591 error = puffs_newnode(ap->a_dvp->v_mount, ap->a_dvp, ap->a_vpp,
592 mknod_arg.pvnr_newnode, ap->a_cnp, ap->a_vap->va_type,
593 ap->a_vap->va_rdev);
594
595 out:
596 if (error || (ap->a_cnp->cn_flags & SAVESTART) == 0)
597 PNBUF_PUT(ap->a_cnp->cn_pnbuf);
598 vput(ap->a_dvp);
599 return error;
600 }
601
602 int
603 puffs_open(void *v)
604 {
605 struct vop_open_args /* {
606 const struct vnodeop_desc *a_desc;
607 struct vnode *a_vp;
608 int a_mode;
609 kauth_cred_t a_cred;
610 struct lwp *a_l;
611 } */ *ap = v;
612 struct vnode *vp = ap->a_vp;
613 struct puffs_mount *pmp = MPTOPUFFSMP(vp->v_mount);
614 int mode = ap->a_mode;
615 int error;
616
617 PUFFS_VNREQ(open);
618 DPRINTF(("puffs_open: vp %p, mode 0x%x\n", vp, mode));
619
620 if (vp->v_type == VREG && mode & FWRITE && !EXISTSOP(pmp, WRITE))
621 ERROUT(EROFS);
622
623 if (!EXISTSOP(pmp, OPEN))
624 ERROUT(0);
625
626 open_arg.pvnr_mode = mode;
627 puffs_credcvt(&open_arg.pvnr_cred, ap->a_cred);
628 puffs_cidcvt(&open_arg.pvnr_cid, ap->a_l);
629
630 error = puffs_vntouser(MPTOPUFFSMP(vp->v_mount), PUFFS_VN_OPEN,
631 &open_arg, sizeof(open_arg), 0, vp, NULL);
632
633 out:
634 DPRINTF(("puffs_open: returning %d\n", error));
635 return error;
636 }
637
638 int
639 puffs_close(void *v)
640 {
641 struct vop_close_args /* {
642 const struct vnodeop_desc *a_desc;
643 struct vnode *a_vp;
644 int a_fflag;
645 kauth_cred_t a_cred;
646 struct lwp *a_l;
647 } */ *ap = v;
648 struct puffs_vnreq_close *close_argp;
649
650 close_argp = malloc(sizeof(struct puffs_vnreq_close),
651 M_PUFFS, M_WAITOK | M_ZERO);
652 close_argp->pvnr_fflag = ap->a_fflag;
653 puffs_credcvt(&close_argp->pvnr_cred, ap->a_cred);
654 puffs_cidcvt(&close_argp->pvnr_cid, ap->a_l);
655
656 puffs_vntouser_faf(MPTOPUFFSMP(ap->a_vp->v_mount), PUFFS_VN_CLOSE,
657 close_argp, sizeof(struct puffs_vnreq_close), ap->a_vp);
658
659 return 0;
660 }
661
662 int
663 puffs_access(void *v)
664 {
665 struct vop_access_args /* {
666 const struct vnodeop_desc *a_desc;
667 struct vnode *a_vp;
668 int a_mode;
669 kauth_cred_t a_cred;
670 struct lwp *a_l;
671 } */ *ap = v;
672 struct vnode *vp = ap->a_vp;
673 struct puffs_mount *pmp = MPTOPUFFSMP(vp->v_mount);
674 int mode = ap->a_mode;
675
676 PUFFS_VNREQ(access);
677
678 if (vp->v_type == VREG && mode & VWRITE && !EXISTSOP(pmp, WRITE))
679 return EROFS;
680
681 if (!EXISTSOP(pmp, ACCESS))
682 return 0;
683
684 access_arg.pvnr_mode = ap->a_mode;
685 puffs_credcvt(&access_arg.pvnr_cred, ap->a_cred);
686 puffs_cidcvt(&access_arg.pvnr_cid, ap->a_l);
687
688 return puffs_vntouser(MPTOPUFFSMP(vp->v_mount), PUFFS_VN_ACCESS,
689 &access_arg, sizeof(access_arg), 0, vp, NULL);
690 }
691
692 int
693 puffs_getattr(void *v)
694 {
695 struct vop_getattr_args /* {
696 const struct vnodeop_desc *a_desc;
697 struct vnode *a_vp;
698 struct vattr *a_vap;
699 kauth_cred_t a_cred;
700 struct lwp *a_l;
701 } */ *ap = v;
702 struct mount *mp;
703 struct vnode *vp;
704 struct vattr *vap, *rvap;
705 struct puffs_node *pn;
706 int error;
707
708 PUFFS_VNREQ(getattr);
709
710 vp = ap->a_vp;
711 mp = vp->v_mount;
712 vap = ap->a_vap;
713
714 vattr_null(&getattr_arg.pvnr_va);
715 puffs_credcvt(&getattr_arg.pvnr_cred, ap->a_cred);
716 puffs_cidcvt(&getattr_arg.pvnr_cid, ap->a_l);
717
718 error = puffs_vntouser(MPTOPUFFSMP(vp->v_mount), PUFFS_VN_GETATTR,
719 &getattr_arg, sizeof(getattr_arg), 0, vp, NULL);
720 if (error)
721 return error;
722
723 rvap = &getattr_arg.pvnr_va;
724 /*
725 * Don't listen to the file server regarding special device
726 * size info, the file server doesn't know anything about them.
727 */
728 if (vp->v_type == VBLK || vp->v_type == VCHR)
729 rvap->va_size = vp->v_size;
730
731 /* Ditto for blocksize (ufs comment: this doesn't belong here) */
732 if (vp->v_type == VBLK)
733 rvap->va_blocksize = BLKDEV_IOSIZE;
734 else if (vp->v_type == VCHR)
735 rvap->va_blocksize = MAXBSIZE;
736
737 (void) memcpy(vap, rvap, sizeof(struct vattr));
738 vap->va_fsid = mp->mnt_stat.f_fsidx.__fsid_val[0];
739
740 pn = VPTOPP(vp);
741 if (pn->pn_stat & PNODE_METACACHE_ATIME)
742 vap->va_atime = pn->pn_mc_atime;
743 if (pn->pn_stat & PNODE_METACACHE_CTIME)
744 vap->va_ctime = pn->pn_mc_ctime;
745 if (pn->pn_stat & PNODE_METACACHE_MTIME)
746 vap->va_mtime = pn->pn_mc_mtime;
747 if (pn->pn_stat & PNODE_METACACHE_SIZE) {
748 vap->va_size = pn->pn_mc_size;
749 } else {
750 if (rvap->va_size != VNOVAL
751 && vp->v_type != VBLK && vp->v_type != VCHR)
752 uvm_vnp_setsize(vp, rvap->va_size);
753 }
754
755 return 0;
756 }
757
758 int
759 puffs_setattr(void *v)
760 {
761 struct vop_getattr_args /* {
762 const struct vnodeop_desc *a_desc;
763 struct vnode *a_vp;
764 struct vattr *a_vap;
765 kauth_cred_t a_cred;
766 struct lwp *a_l;
767 } */ *ap = v;
768 int error;
769 struct vattr *vap = ap->a_vap;
770 struct puffs_node *pn = ap->a_vp->v_data;
771
772 PUFFS_VNREQ(setattr);
773
774 /*
775 * Flush metacache first. If we are called with some explicit
776 * parameters, treat them as information overriding metacache
777 * information.
778 */
779 if (pn->pn_stat & PNODE_METACACHE_MASK) {
780 if ((pn->pn_stat & PNODE_METACACHE_ATIME)
781 && vap->va_atime.tv_sec == VNOVAL)
782 vap->va_atime = pn->pn_mc_atime;
783 if ((pn->pn_stat & PNODE_METACACHE_CTIME)
784 && vap->va_ctime.tv_sec == VNOVAL)
785 vap->va_ctime = pn->pn_mc_ctime;
786 if ((pn->pn_stat & PNODE_METACACHE_MTIME)
787 && vap->va_mtime.tv_sec == VNOVAL)
788 vap->va_mtime = pn->pn_mc_mtime;
789 if ((pn->pn_stat & PNODE_METACACHE_SIZE)
790 && vap->va_size == VNOVAL)
791 vap->va_size = pn->pn_mc_size;
792
793 pn->pn_stat &= ~PNODE_METACACHE_MASK;
794 }
795
796 (void)memcpy(&setattr_arg.pvnr_va, vap, sizeof(struct vattr));
797 puffs_credcvt(&setattr_arg.pvnr_cred, ap->a_cred);
798 puffs_cidcvt(&setattr_arg.pvnr_cid, ap->a_l);
799
800 error = puffs_vntouser(MPTOPUFFSMP(ap->a_vp->v_mount), PUFFS_VN_SETATTR,
801 &setattr_arg, sizeof(setattr_arg), 0, ap->a_vp, NULL);
802 if (error)
803 return error;
804
805 if (vap->va_size != VNOVAL)
806 uvm_vnp_setsize(ap->a_vp, vap->va_size);
807
808 return 0;
809 }
810
811 int
812 puffs_inactive(void *v)
813 {
814 struct vop_inactive_args /* {
815 const struct vnodeop_desc *a_desc;
816 struct vnode *a_vp;
817 struct lwp *a_l;
818 } */ *ap = v;
819 struct puffs_mount *pmp;
820 struct puffs_node *pnode;
821 int rv, call;
822
823 PUFFS_VNREQ(inactive);
824
825 /*
826 * XXX: think about this after we really start unlocking
827 * when going to userspace
828 */
829 pnode = ap->a_vp->v_data;
830
831 pmp = MPTOPUFFSMP(ap->a_vp->v_mount);
832
833 puffs_cidcvt(&inactive_arg.pvnr_cid, ap->a_l);
834
835 if (EXISTSOP(pmp, INACTIVE))
836 if (pmp->pmp_flags & PUFFS_KFLAG_IAONDEMAND)
837 if ((pnode->pn_stat & PNODE_DOINACT) || ALLOPS(pmp))
838 call = 1;
839 else
840 call = 0;
841 else
842 call = 1;
843 else
844 call = 0;
845
846 if (call)
847 rv = puffs_vntouser(pmp, PUFFS_VN_INACTIVE,
848 &inactive_arg, sizeof(inactive_arg), 0, ap->a_vp, NULL);
849 else
850 rv = 1; /* see below */
851 pnode->pn_stat &= ~PNODE_DOINACT;
852
853 VOP_UNLOCK(ap->a_vp, 0);
854
855 /*
856 * file server thinks it's gone? then don't be afraid care,
857 * node's life was already all it would ever be
858 */
859 if (pnode->pn_stat & PNODE_NOREFS) {
860 pnode->pn_stat |= PNODE_DYING;
861 vrecycle(ap->a_vp, NULL, ap->a_l);
862 }
863
864 return 0;
865 }
866
867 /*
868 * always FAF, we don't really care if the server wants to fail to
869 * reclaim the node or not
870 */
871 int
872 puffs_reclaim(void *v)
873 {
874 struct vop_reclaim_args /* {
875 const struct vnodeop_desc *a_desc;
876 struct vnode *a_vp;
877 struct lwp *a_l;
878 } */ *ap = v;
879 struct puffs_mount *pmp;
880 struct puffs_vnreq_reclaim *reclaim_argp;
881
882 pmp = MPTOPUFFSMP(ap->a_vp->v_mount);
883
884 /*
885 * first things first: check if someone is trying to reclaim the
886 * root vnode. do not allow that to travel to userspace.
887 * Note that we don't need to take the lock similarly to
888 * puffs_root(), since there is only one of us.
889 */
890 if (ap->a_vp->v_flag & VROOT) {
891 mutex_enter(&pmp->pmp_lock);
892 KASSERT(pmp->pmp_root != NULL);
893 pmp->pmp_root = NULL;
894 mutex_exit(&pmp->pmp_lock);
895 goto out;
896 }
897
898 if (!EXISTSOP(pmp, RECLAIM))
899 goto out;
900
901 reclaim_argp = malloc(sizeof(struct puffs_vnreq_reclaim),
902 M_PUFFS, M_WAITOK | M_ZERO);
903 puffs_cidcvt(&reclaim_argp->pvnr_cid, ap->a_l);
904
905 puffs_vntouser_faf(pmp, PUFFS_VN_RECLAIM,
906 reclaim_argp, sizeof(struct puffs_vnreq_reclaim), ap->a_vp);
907
908 out:
909 if (PUFFS_USE_NAMECACHE(pmp))
910 cache_purge(ap->a_vp);
911 puffs_putvnode(ap->a_vp);
912
913 return 0;
914 }
915
916 #define CSIZE sizeof(**ap->a_cookies)
917 int
918 puffs_readdir(void *v)
919 {
920 struct vop_readdir_args /* {
921 const struct vnodeop_desc *a_desc;
922 struct vnode *a_vp;
923 struct uio *a_uio;
924 kauth_cred_t a_cred;
925 int *a_eofflag;
926 off_t **a_cookies;
927 int *a_ncookies;
928 } */ *ap = v;
929 struct puffs_mount *pmp = MPTOPUFFSMP(ap->a_vp->v_mount);
930 struct puffs_vnreq_readdir *readdir_argp;
931 size_t argsize, tomove, cookiemem, cookiesmax;
932 struct uio *uio = ap->a_uio;
933 size_t howmuch;
934 int error;
935
936 if (ap->a_cookies) {
937 KASSERT(ap->a_ncookies != NULL);
938 if (pmp->pmp_args.pa_fhsize == 0)
939 return EOPNOTSUPP;
940 cookiesmax = uio->uio_resid/_DIRENT_MINSIZE((struct dirent *)0);
941 cookiemem = ALIGN(cookiesmax*CSIZE); /* play safe */
942 } else {
943 cookiesmax = 0;
944 cookiemem = 0;
945 }
946
947 argsize = sizeof(struct puffs_vnreq_readdir);
948 tomove = uio->uio_resid + cookiemem;
949 readdir_argp = malloc(argsize + tomove, M_PUFFS, M_ZERO | M_WAITOK);
950
951 puffs_credcvt(&readdir_argp->pvnr_cred, ap->a_cred);
952 readdir_argp->pvnr_offset = uio->uio_offset;
953 readdir_argp->pvnr_resid = uio->uio_resid;
954 readdir_argp->pvnr_ncookies = cookiesmax;
955 readdir_argp->pvnr_eofflag = 0;
956 readdir_argp->pvnr_dentoff = cookiemem;
957
958 error = puffs_vntouser(MPTOPUFFSMP(ap->a_vp->v_mount),
959 PUFFS_VN_READDIR, readdir_argp, argsize, tomove,
960 ap->a_vp, NULL);
961 if (error)
962 goto out;
963
964 /* userspace is cheating? */
965 if (readdir_argp->pvnr_resid > uio->uio_resid
966 || readdir_argp->pvnr_ncookies > cookiesmax)
967 ERROUT(EINVAL);
968
969 /* check eof */
970 if (readdir_argp->pvnr_eofflag)
971 *ap->a_eofflag = 1;
972
973 /* bouncy-wouncy with the directory data */
974 howmuch = uio->uio_resid - readdir_argp->pvnr_resid;
975
976 /* force eof if no data was returned (getcwd() needs this) */
977 if (howmuch == 0) {
978 *ap->a_eofflag = 1;
979 goto out;
980 }
981
982 error = uiomove(readdir_argp->pvnr_data + cookiemem, howmuch, uio);
983 if (error)
984 goto out;
985
986 /* provide cookies to caller if so desired */
987 if (ap->a_cookies) {
988 *ap->a_cookies = malloc(readdir_argp->pvnr_ncookies*CSIZE,
989 M_TEMP, M_WAITOK);
990 *ap->a_ncookies = readdir_argp->pvnr_ncookies;
991 memcpy(*ap->a_cookies, readdir_argp->pvnr_data,
992 *ap->a_ncookies*CSIZE);
993 }
994
995 /* next readdir starts here */
996 uio->uio_offset = readdir_argp->pvnr_offset;
997
998 out:
999 free(readdir_argp, M_PUFFS);
1000 return error;
1001 }
1002 #undef CSIZE
1003
1004 /*
1005 * poll works by consuming the bitmask in pn_revents. If there are
1006 * events available, poll returns immediately. If not, it issues a
1007 * poll to userspace, selrecords itself and returns with no available
1008 * events. When the file server returns, it executes puffs_parkdone_poll(),
1009 * where available events are added to the bitmask. selnotify() is
1010 * then also executed by that function causing us to enter here again
1011 * and hopefully find the missing bits (unless someone got them first,
1012 * in which case it starts all over again).
1013 */
1014 int
1015 puffs_poll(void *v)
1016 {
1017 struct vop_poll_args /* {
1018 const struct vnodeop_desc *a_desc;
1019 struct vnode *a_vp;
1020 int a_events;
1021 struct lwp *a_l;
1022 }*/ *ap = v;
1023 struct vnode *vp = ap->a_vp;
1024 struct puffs_mount *pmp = MPTOPUFFSMP(vp->v_mount);
1025 struct puffs_vnreq_poll *poll_argp;
1026 struct puffs_node *pn = vp->v_data;
1027 int events;
1028
1029 if (EXISTSOP(pmp, POLL)) {
1030 mutex_enter(&pn->pn_mtx);
1031 events = pn->pn_revents & ap->a_events;
1032 if (events & ap->a_events) {
1033 pn->pn_revents &= ~ap->a_events;
1034 mutex_exit(&pn->pn_mtx);
1035
1036 return events;
1037 } else {
1038 puffs_referencenode(pn);
1039 mutex_exit(&pn->pn_mtx);
1040
1041 /* freed in puffs_parkdone_poll */
1042 poll_argp = malloc(sizeof(struct puffs_vnreq_poll),
1043 M_PUFFS, M_ZERO | M_WAITOK);
1044
1045 poll_argp->pvnr_events = ap->a_events;
1046 puffs_cidcvt(&poll_argp->pvnr_cid, ap->a_l);
1047
1048 selrecord(ap->a_l, &pn->pn_sel);
1049 puffs_vntouser_call(pmp, PUFFS_VN_POLL,
1050 poll_argp, sizeof(struct puffs_vnreq_poll), 0,
1051 puffs_parkdone_poll, pn,
1052 vp, NULL);
1053
1054 return 0;
1055 }
1056 } else {
1057 return genfs_poll(v);
1058 }
1059 }
1060
1061 int
1062 puffs_fsync(void *v)
1063 {
1064 struct vop_fsync_args /* {
1065 const struct vnodeop_desc *a_desc;
1066 struct vnode *a_vp;
1067 kauth_cred_t a_cred;
1068 int a_flags;
1069 off_t a_offlo;
1070 off_t a_offhi;
1071 struct lwp *a_l;
1072 } */ *ap = v;
1073 struct vattr va;
1074 struct puffs_mount *pmp;
1075 struct puffs_vnreq_fsync *fsync_argp;
1076 struct vnode *vp;
1077 struct puffs_node *pn;
1078 int pflags, error, dofaf;
1079
1080 PUFFS_VNREQ(fsync);
1081
1082 vp = ap->a_vp;
1083 pn = VPTOPP(vp);
1084 pmp = MPTOPUFFSMP(vp->v_mount);
1085
1086 /* flush out information from our metacache, see vop_setattr */
1087 if (pn->pn_stat & PNODE_METACACHE_MASK
1088 && (pn->pn_stat & PNODE_DYING) == 0) {
1089 vattr_null(&va);
1090 error = VOP_SETATTR(vp, &va, FSCRED, NULL);
1091 if (error)
1092 return error;
1093 }
1094
1095 /*
1096 * flush pages to avoid being overly dirty
1097 */
1098 pflags = PGO_CLEANIT;
1099 if (ap->a_flags & FSYNC_WAIT)
1100 pflags |= PGO_SYNCIO;
1101 simple_lock(&vp->v_interlock);
1102 error = VOP_PUTPAGES(vp, trunc_page(ap->a_offlo),
1103 round_page(ap->a_offhi), pflags);
1104 if (error)
1105 return error;
1106
1107 /*
1108 * HELLO! We exit already here if the user server does not
1109 * support fsync OR if we should call fsync for a node which
1110 * has references neither in the kernel or the fs server.
1111 * Otherwise we continue to issue fsync() forward.
1112 */
1113 if (!EXISTSOP(pmp, FSYNC) || (pn->pn_stat & PNODE_DYING))
1114 return 0;
1115
1116 dofaf = (ap->a_flags & FSYNC_WAIT) == 0 || ap->a_flags == FSYNC_LAZY;
1117 /*
1118 * We abuse VXLOCK to mean "vnode is going to die", so we issue
1119 * only FAFs for those. Otherwise there's a danger of deadlock,
1120 * since the execution context here might be the user server
1121 * doing some operation on another fs, which in turn caused a
1122 * vnode to be reclaimed from the freelist for this fs.
1123 */
1124 if (dofaf == 0) {
1125 simple_lock(&vp->v_interlock);
1126 if (vp->v_flag & VXLOCK)
1127 dofaf = 1;
1128 simple_unlock(&vp->v_interlock);
1129 }
1130
1131 if (dofaf == 0) {
1132 fsync_argp = &fsync_arg;
1133 } else {
1134 fsync_argp = malloc(sizeof(struct puffs_vnreq_fsync),
1135 M_PUFFS, M_ZERO | M_NOWAIT);
1136 if (fsync_argp == NULL)
1137 return ENOMEM;
1138 }
1139
1140 puffs_credcvt(&fsync_argp->pvnr_cred, ap->a_cred);
1141 fsync_argp->pvnr_flags = ap->a_flags;
1142 fsync_argp->pvnr_offlo = ap->a_offlo;
1143 fsync_argp->pvnr_offhi = ap->a_offhi;
1144 puffs_cidcvt(&fsync_argp->pvnr_cid, ap->a_l);
1145
1146 /*
1147 * XXX: see comment at puffs_getattr about locking
1148 *
1149 * If we are not required to wait, do a FAF operation.
1150 * Otherwise block here.
1151 */
1152 if (dofaf == 0) {
1153 error = puffs_vntouser(MPTOPUFFSMP(vp->v_mount),
1154 PUFFS_VN_FSYNC, fsync_argp, sizeof(*fsync_argp), 0,
1155 vp, NULL);
1156 } else {
1157 /* FAF is always "succesful" */
1158 error = 0;
1159 puffs_vntouser_faf(MPTOPUFFSMP(vp->v_mount),
1160 PUFFS_VN_FSYNC, fsync_argp, sizeof(*fsync_argp), vp);
1161 }
1162
1163 return error;
1164 }
1165
1166 int
1167 puffs_seek(void *v)
1168 {
1169 struct vop_seek_args /* {
1170 const struct vnodeop_desc *a_desc;
1171 struct vnode *a_vp;
1172 off_t a_oldoff;
1173 off_t a_newoff;
1174 kauth_cred_t a_cred;
1175 } */ *ap = v;
1176
1177 PUFFS_VNREQ(seek);
1178
1179 seek_arg.pvnr_oldoff = ap->a_oldoff;
1180 seek_arg.pvnr_newoff = ap->a_newoff;
1181 puffs_credcvt(&seek_arg.pvnr_cred, ap->a_cred);
1182
1183 /*
1184 * XXX: seems like seek is called with an unlocked vp, but
1185 * it can't hurt to play safe
1186 */
1187 return puffs_vntouser(MPTOPUFFSMP(ap->a_vp->v_mount), PUFFS_VN_SEEK,
1188 &seek_arg, sizeof(seek_arg), 0, ap->a_vp, NULL);
1189 }
1190
1191 int
1192 puffs_remove(void *v)
1193 {
1194 struct vop_remove_args /* {
1195 const struct vnodeop_desc *a_desc;
1196 struct vnode *a_dvp;
1197 struct vnode *a_vp;
1198 struct componentname *a_cnp;
1199 } */ *ap = v;
1200 struct puffs_mount *pmp = MPTOPUFFSMP(ap->a_dvp->v_mount);
1201 int error;
1202
1203 PUFFS_VNREQ(remove);
1204
1205 remove_arg.pvnr_cookie_targ = VPTOPNC(ap->a_vp);
1206 puffs_makecn(&remove_arg.pvnr_cn, &remove_arg.pvnr_cn_cred,
1207 &remove_arg.pvnr_cn_cid, ap->a_cnp, PUFFS_USE_FULLPNBUF(pmp));
1208
1209 error = puffs_vntouser(pmp, PUFFS_VN_REMOVE,
1210 &remove_arg, sizeof(remove_arg), 0, ap->a_dvp, ap->a_vp);
1211
1212 vput(ap->a_vp);
1213 if (ap->a_dvp == ap->a_vp)
1214 vrele(ap->a_dvp);
1215 else
1216 vput(ap->a_dvp);
1217
1218 return error;
1219 }
1220
1221 int
1222 puffs_mkdir(void *v)
1223 {
1224 struct vop_mkdir_args /* {
1225 const struct vnodeop_desc *a_desc;
1226 struct vnode *a_dvp;
1227 struct vnode **a_vpp;
1228 struct componentname *a_cnp;
1229 struct vattr *a_vap;
1230 } */ *ap = v;
1231 struct puffs_mount *pmp = MPTOPUFFSMP(ap->a_dvp->v_mount);
1232 int error;
1233
1234 PUFFS_VNREQ(mkdir);
1235
1236 puffs_makecn(&mkdir_arg.pvnr_cn, &mkdir_arg.pvnr_cn_cred,
1237 &mkdir_arg.pvnr_cn_cid, ap->a_cnp, PUFFS_USE_FULLPNBUF(pmp));
1238 mkdir_arg.pvnr_va = *ap->a_vap;
1239
1240 error = puffs_vntouser(pmp, PUFFS_VN_MKDIR,
1241 &mkdir_arg, sizeof(mkdir_arg), 0, ap->a_dvp, NULL);
1242 if (error)
1243 goto out;
1244
1245 error = puffs_newnode(ap->a_dvp->v_mount, ap->a_dvp, ap->a_vpp,
1246 mkdir_arg.pvnr_newnode, ap->a_cnp, VDIR, 0);
1247
1248 out:
1249 if (error || (ap->a_cnp->cn_flags & SAVESTART) == 0)
1250 PNBUF_PUT(ap->a_cnp->cn_pnbuf);
1251 vput(ap->a_dvp);
1252 return error;
1253 }
1254
1255 int
1256 puffs_rmdir(void *v)
1257 {
1258 struct vop_rmdir_args /* {
1259 const struct vnodeop_desc *a_desc;
1260 struct vnode *a_dvp;
1261 struct vnode *a_vp;
1262 struct componentname *a_cnp;
1263 } */ *ap = v;
1264 struct puffs_mount *pmp = MPTOPUFFSMP(ap->a_dvp->v_mount);
1265 int error;
1266
1267 PUFFS_VNREQ(rmdir);
1268
1269 rmdir_arg.pvnr_cookie_targ = VPTOPNC(ap->a_vp);
1270 puffs_makecn(&rmdir_arg.pvnr_cn, &rmdir_arg.pvnr_cn_cred,
1271 &rmdir_arg.pvnr_cn_cid, ap->a_cnp, PUFFS_USE_FULLPNBUF(pmp));
1272
1273 error = puffs_vntouser(pmp, PUFFS_VN_RMDIR,
1274 &rmdir_arg, sizeof(rmdir_arg), 0, ap->a_dvp, ap->a_vp);
1275
1276 /* XXX: some call cache_purge() *for both vnodes* here, investigate */
1277
1278 vput(ap->a_dvp);
1279 vput(ap->a_vp);
1280
1281 return error;
1282 }
1283
1284 int
1285 puffs_link(void *v)
1286 {
1287 struct vop_link_args /* {
1288 const struct vnodeop_desc *a_desc;
1289 struct vnode *a_dvp;
1290 struct vnode *a_vp;
1291 struct componentname *a_cnp;
1292 }*/ *ap = v;
1293 struct puffs_mount *pmp = MPTOPUFFSMP(ap->a_dvp->v_mount);
1294 int error;
1295
1296 PUFFS_VNREQ(link);
1297
1298 link_arg.pvnr_cookie_targ = VPTOPNC(ap->a_vp);
1299 puffs_makecn(&link_arg.pvnr_cn, &link_arg.pvnr_cn_cred,
1300 &link_arg.pvnr_cn_cid, ap->a_cnp, PUFFS_USE_FULLPNBUF(pmp));
1301
1302 error = puffs_vntouser(pmp, PUFFS_VN_LINK,
1303 &link_arg, sizeof(link_arg), 0, ap->a_dvp, ap->a_vp);
1304
1305 /*
1306 * XXX: stay in touch with the cache. I don't like this, but
1307 * don't have a better solution either. See also puffs_rename().
1308 */
1309 if (error == 0)
1310 puffs_updatenode(ap->a_vp, PUFFS_UPDATECTIME);
1311
1312 vput(ap->a_dvp);
1313
1314 return error;
1315 }
1316
1317 int
1318 puffs_symlink(void *v)
1319 {
1320 struct vop_symlink_args /* {
1321 const struct vnodeop_desc *a_desc;
1322 struct vnode *a_dvp;
1323 struct vnode **a_vpp;
1324 struct componentname *a_cnp;
1325 struct vattr *a_vap;
1326 char *a_target;
1327 }*/ *ap = v;
1328 struct puffs_mount *pmp = MPTOPUFFSMP(ap->a_dvp->v_mount);
1329 struct puffs_vnreq_symlink *symlink_argp;
1330 int error;
1331
1332 *ap->a_vpp = NULL;
1333
1334 symlink_argp = malloc(sizeof(struct puffs_vnreq_symlink),
1335 M_PUFFS, M_ZERO | M_WAITOK);
1336 puffs_makecn(&symlink_argp->pvnr_cn, &symlink_argp->pvnr_cn_cred,
1337 &symlink_argp->pvnr_cn_cid, ap->a_cnp, PUFFS_USE_FULLPNBUF(pmp));
1338 symlink_argp->pvnr_va = *ap->a_vap;
1339 (void)strlcpy(symlink_argp->pvnr_link, ap->a_target,
1340 sizeof(symlink_argp->pvnr_link));
1341
1342 error = puffs_vntouser(pmp, PUFFS_VN_SYMLINK,
1343 symlink_argp, sizeof(*symlink_argp), 0, ap->a_dvp, NULL);
1344 if (error)
1345 goto out;
1346
1347 error = puffs_newnode(ap->a_dvp->v_mount, ap->a_dvp, ap->a_vpp,
1348 symlink_argp->pvnr_newnode, ap->a_cnp, VLNK, 0);
1349
1350 out:
1351 free(symlink_argp, M_PUFFS);
1352 if (error || (ap->a_cnp->cn_flags & SAVESTART) == 0)
1353 PNBUF_PUT(ap->a_cnp->cn_pnbuf);
1354 vput(ap->a_dvp);
1355
1356 return error;
1357 }
1358
1359 int
1360 puffs_readlink(void *v)
1361 {
1362 struct vop_readlink_args /* {
1363 const struct vnodeop_desc *a_desc;
1364 struct vnode *a_vp;
1365 struct uio *a_uio;
1366 kauth_cred_t a_cred;
1367 } */ *ap = v;
1368 size_t linklen;
1369 int error;
1370
1371 PUFFS_VNREQ(readlink);
1372
1373 puffs_credcvt(&readlink_arg.pvnr_cred, ap->a_cred);
1374 linklen = sizeof(readlink_arg.pvnr_link);
1375 readlink_arg.pvnr_linklen = linklen;
1376
1377 error = puffs_vntouser(MPTOPUFFSMP(ap->a_vp->v_mount),
1378 PUFFS_VN_READLINK, &readlink_arg, sizeof(readlink_arg), 0,
1379 ap->a_vp, NULL);
1380 if (error)
1381 return error;
1382
1383 /* bad bad user file server */
1384 if (readlink_arg.pvnr_linklen > linklen)
1385 return EINVAL;
1386
1387 return uiomove(&readlink_arg.pvnr_link, readlink_arg.pvnr_linklen,
1388 ap->a_uio);
1389 }
1390
1391 int
1392 puffs_rename(void *v)
1393 {
1394 struct vop_rename_args /* {
1395 const struct vnodeop_desc *a_desc;
1396 struct vnode *a_fdvp;
1397 struct vnode *a_fvp;
1398 struct componentname *a_fcnp;
1399 struct vnode *a_tdvp;
1400 struct vnode *a_tvp;
1401 struct componentname *a_tcnp;
1402 }*/ *ap = v;
1403 struct puffs_vnreq_rename *rename_argp = NULL;
1404 struct puffs_mount *pmp = MPTOPUFFSMP(ap->a_fdvp->v_mount);
1405 int error;
1406
1407 if (ap->a_fvp->v_mount != ap->a_tdvp->v_mount)
1408 ERROUT(EXDEV);
1409
1410 rename_argp = malloc(sizeof(struct puffs_vnreq_rename),
1411 M_PUFFS, M_WAITOK | M_ZERO);
1412
1413 rename_argp->pvnr_cookie_src = VPTOPNC(ap->a_fvp);
1414 rename_argp->pvnr_cookie_targdir = VPTOPNC(ap->a_tdvp);
1415 if (ap->a_tvp)
1416 rename_argp->pvnr_cookie_targ = VPTOPNC(ap->a_tvp);
1417 else
1418 rename_argp->pvnr_cookie_targ = NULL;
1419 puffs_makecn(&rename_argp->pvnr_cn_src,
1420 &rename_argp->pvnr_cn_src_cred, &rename_argp->pvnr_cn_src_cid,
1421 ap->a_fcnp, PUFFS_USE_FULLPNBUF(pmp));
1422 puffs_makecn(&rename_argp->pvnr_cn_targ,
1423 &rename_argp->pvnr_cn_targ_cred, &rename_argp->pvnr_cn_targ_cid,
1424 ap->a_tcnp, PUFFS_USE_FULLPNBUF(pmp));
1425
1426 error = puffs_vntouser(pmp, PUFFS_VN_RENAME,
1427 rename_argp, sizeof(*rename_argp), 0, ap->a_fdvp, NULL); /* XXX */
1428
1429 /*
1430 * XXX: stay in touch with the cache. I don't like this, but
1431 * don't have a better solution either. See also puffs_link().
1432 */
1433 if (error == 0)
1434 puffs_updatenode(ap->a_fvp, PUFFS_UPDATECTIME);
1435
1436 out:
1437 if (rename_argp)
1438 free(rename_argp, M_PUFFS);
1439 if (ap->a_tvp != NULL)
1440 vput(ap->a_tvp);
1441 if (ap->a_tdvp == ap->a_tvp)
1442 vrele(ap->a_tdvp);
1443 else
1444 vput(ap->a_tdvp);
1445
1446 vrele(ap->a_fdvp);
1447 vrele(ap->a_fvp);
1448
1449 return error;
1450 }
1451
/*
 * Fill in the common header of a read/write request: I/O flags, the
 * number of bytes to move, the file offset and the credentials.
 *
 * Wrapped in do { } while (0) so that the macro behaves as a single
 * statement, e.g. as the body of an unbraced if.
 */
#define RWARGS(cont, iofl, move, offset, creds)				\
do {									\
	(cont)->pvnr_ioflag = (iofl);					\
	(cont)->pvnr_resid = (move);					\
	(cont)->pvnr_offset = (offset);					\
	puffs_credcvt(&(cont)->pvnr_cred, (creds));			\
} while (/*CONSTCOND*/0)
1457
1458 int
1459 puffs_read(void *v)
1460 {
1461 struct vop_read_args /* {
1462 const struct vnodeop_desc *a_desc;
1463 struct vnode *a_vp;
1464 struct uio *a_uio;
1465 int a_ioflag;
1466 kauth_cred_t a_cred;
1467 } */ *ap = v;
1468 struct puffs_vnreq_read *read_argp;
1469 struct puffs_mount *pmp;
1470 struct vnode *vp;
1471 struct uio *uio;
1472 void *win;
1473 size_t tomove, argsize;
1474 vsize_t bytelen;
1475 int error, ubcflags;
1476
1477 uio = ap->a_uio;
1478 vp = ap->a_vp;
1479 read_argp = NULL;
1480 error = 0;
1481 pmp = MPTOPUFFSMP(vp->v_mount);
1482
1483 /* std sanity */
1484 if (uio->uio_resid == 0)
1485 return 0;
1486 if (uio->uio_offset < 0)
1487 return EINVAL;
1488
1489 if (vp->v_type == VREG && PUFFS_USE_PAGECACHE(pmp)) {
1490 const int advice = IO_ADV_DECODE(ap->a_ioflag);
1491
1492 ubcflags = 0;
1493 if (UBC_WANT_UNMAP(vp))
1494 ubcflags = UBC_UNMAP;
1495
1496 while (uio->uio_resid > 0) {
1497 bytelen = MIN(uio->uio_resid,
1498 vp->v_size - uio->uio_offset);
1499 if (bytelen == 0)
1500 break;
1501
1502 win = ubc_alloc(&vp->v_uobj, uio->uio_offset,
1503 &bytelen, advice, UBC_READ);
1504 error = uiomove(win, bytelen, uio);
1505 ubc_release(win, ubcflags);
1506 if (error)
1507 break;
1508 }
1509
1510 if ((vp->v_mount->mnt_flag & MNT_NOATIME) == 0)
1511 puffs_updatenode(vp, PUFFS_UPDATEATIME);
1512 } else {
1513 /*
1514 * in case it's not a regular file or we're operating
1515 * uncached, do read in the old-fashioned style,
1516 * i.e. explicit read operations
1517 */
1518
1519 tomove = PUFFS_TOMOVE(uio->uio_resid, pmp);
1520 argsize = sizeof(struct puffs_vnreq_read);
1521 read_argp = malloc(argsize + tomove,
1522 M_PUFFS, M_WAITOK | M_ZERO);
1523
1524 error = 0;
1525 while (uio->uio_resid > 0) {
1526 tomove = PUFFS_TOMOVE(uio->uio_resid, pmp);
1527 RWARGS(read_argp, ap->a_ioflag, tomove,
1528 uio->uio_offset, ap->a_cred);
1529
1530 error = puffs_vntouser(pmp, PUFFS_VN_READ,
1531 read_argp, argsize, tomove,
1532 ap->a_vp, NULL);
1533 if (error)
1534 break;
1535
1536 if (read_argp->pvnr_resid > tomove) {
1537 error = EINVAL;
1538 break;
1539 }
1540
1541 error = uiomove(read_argp->pvnr_data,
1542 tomove - read_argp->pvnr_resid, uio);
1543
1544 /*
1545 * in case the file is out of juice, resid from
1546 * userspace is != 0. and the error-case is
1547 * quite obvious
1548 */
1549 if (error || read_argp->pvnr_resid)
1550 break;
1551 }
1552 }
1553
1554 if (read_argp)
1555 free(read_argp, M_PUFFS);
1556 return error;
1557 }
1558
1559 /*
1560 * XXX: in case of a failure, this leaves uio in a bad state.
1561 * We could theoretically copy the uio and iovecs and "replay"
1562 * them the right amount after the userspace trip, but don't
1563 * bother for now.
1564 */
1565 int
1566 puffs_write(void *v)
1567 {
1568 struct vop_write_args /* {
1569 const struct vnodeop_desc *a_desc;
1570 struct vnode *a_vp;
1571 struct uio *a_uio;
1572 int a_ioflag;
1573 kauth_cred_t a_cred;
1574 } */ *ap = v;
1575 struct puffs_vnreq_write *write_argp;
1576 struct puffs_mount *pmp;
1577 struct uio *uio;
1578 struct vnode *vp;
1579 size_t tomove, argsize;
1580 off_t oldoff, newoff, origoff;
1581 vsize_t bytelen;
1582 int error, uflags;
1583 int ubcflags;
1584
1585 vp = ap->a_vp;
1586 uio = ap->a_uio;
1587 error = uflags = 0;
1588 write_argp = NULL;
1589 pmp = MPTOPUFFSMP(ap->a_vp->v_mount);
1590
1591 if (vp->v_type == VREG && PUFFS_USE_PAGECACHE(pmp)) {
1592 ubcflags = UBC_WRITE | UBC_PARTIALOK;
1593 if (UBC_WANT_UNMAP(vp))
1594 ubcflags = UBC_UNMAP;
1595
1596 /*
1597 * userspace *should* be allowed to control this,
1598 * but with UBC it's a bit unclear how to handle it
1599 */
1600 if (ap->a_ioflag & IO_APPEND)
1601 uio->uio_offset = vp->v_size;
1602
1603 origoff = uio->uio_offset;
1604 while (uio->uio_resid > 0) {
1605 uflags |= PUFFS_UPDATECTIME;
1606 uflags |= PUFFS_UPDATEMTIME;
1607 oldoff = uio->uio_offset;
1608 bytelen = uio->uio_resid;
1609
1610 newoff = oldoff + bytelen;
1611 if (vp->v_size < newoff) {
1612 uvm_vnp_setwritesize(vp, newoff);
1613 }
1614 error = ubc_uiomove(&vp->v_uobj, uio, bytelen,
1615 ubcflags);
1616
1617 /*
1618 * In case of a ubc_uiomove() error,
1619 * opt to not extend the file at all and
1620 * return an error. Otherwise, if we attempt
1621 * to clear the memory we couldn't fault to,
1622 * we might generate a kernel page fault.
1623 */
1624 if (vp->v_size < newoff) {
1625 if (error == 0) {
1626 uflags |= PUFFS_UPDATESIZE;
1627 uvm_vnp_setsize(vp, newoff);
1628 } else {
1629 uvm_vnp_setwritesize(vp, vp->v_size);
1630 }
1631 }
1632 if (error)
1633 break;
1634
1635 /*
1636 * If we're writing large files, flush to file server
1637 * every 64k. Otherwise we can very easily exhaust
1638 * kernel and user memory, as the file server cannot
1639 * really keep up with our writing speed.
1640 *
1641 * Note: this does *NOT* honor MNT_ASYNC, because
1642 * that gives userland too much say in the kernel.
1643 */
1644 if (oldoff >> 16 != uio->uio_offset >> 16) {
1645 simple_lock(&vp->v_interlock);
1646 error = VOP_PUTPAGES(vp, oldoff & ~0xffff,
1647 uio->uio_offset & ~0xffff,
1648 PGO_CLEANIT | PGO_SYNCIO);
1649 if (error)
1650 break;
1651 }
1652 }
1653
1654 /* synchronous I/O? */
1655 if (error == 0 && ap->a_ioflag & IO_SYNC) {
1656 simple_lock(&vp->v_interlock);
1657 error = VOP_PUTPAGES(vp, trunc_page(origoff),
1658 round_page(uio->uio_offset),
1659 PGO_CLEANIT | PGO_SYNCIO);
1660
1661 /* write though page cache? */
1662 } else if (error == 0 && pmp->pmp_flags & PUFFS_KFLAG_WTCACHE) {
1663 simple_lock(&vp->v_interlock);
1664 error = VOP_PUTPAGES(vp, trunc_page(origoff),
1665 round_page(uio->uio_offset), PGO_CLEANIT);
1666 }
1667
1668 puffs_updatenode(vp, uflags);
1669 } else {
1670 /* tomove is non-increasing */
1671 tomove = PUFFS_TOMOVE(uio->uio_resid, pmp);
1672 argsize = sizeof(struct puffs_vnreq_write) + tomove;
1673 write_argp = malloc(argsize, M_PUFFS, M_WAITOK | M_ZERO);
1674
1675 while (uio->uio_resid > 0) {
1676 /* move data to buffer */
1677 tomove = PUFFS_TOMOVE(uio->uio_resid, pmp);
1678 RWARGS(write_argp, ap->a_ioflag, tomove,
1679 uio->uio_offset, ap->a_cred);
1680 error = uiomove(write_argp->pvnr_data, tomove, uio);
1681 if (error)
1682 break;
1683
1684 /* move buffer to userspace */
1685 error = puffs_vntouser(MPTOPUFFSMP(ap->a_vp->v_mount),
1686 PUFFS_VN_WRITE, write_argp, argsize, 0,
1687 ap->a_vp, NULL);
1688 if (error)
1689 break;
1690
1691 if (write_argp->pvnr_resid > tomove) {
1692 error = EINVAL;
1693 break;
1694 }
1695
1696 /* adjust file size */
1697 if (vp->v_size < uio->uio_offset)
1698 uvm_vnp_setsize(vp, uio->uio_offset);
1699
1700 /* didn't move everything? bad userspace. bail */
1701 if (write_argp->pvnr_resid != 0) {
1702 error = EIO;
1703 break;
1704 }
1705 }
1706 }
1707
1708 if (write_argp)
1709 free(write_argp, M_PUFFS);
1710 return error;
1711 }
1712
static int puffs_fcnioctl(struct vop_ioctl_args * /*XXX*/, int);

/* parenthesized so that it expands safely inside larger expressions */
#define FCNIOCTL_ARG_MAX (1<<16)
/*
 * Common backend of puffs_ioctl() and puffs_fcntl(); puffsop selects
 * the request type.  Currently always fails with EOPNOTSUPP: the
 * real implementation below is compiled out.
 */
int
puffs_fcnioctl(struct vop_ioctl_args *ap, int puffsop)
{

	/* currently not supported */
	return EOPNOTSUPP;
#if 0
	/* struct vop_ioctl_args {
		const struct vnodeop_desc *a_desc;
		struct vnode *a_vp;
		u_long a_command;
		void *a_data;
		int a_fflag;
		kauth_cred_t a_cred;
		struct lwp *a_l;
	}*ap = v; */
	struct puffs_mount *pmp;
	struct puffs_sizepark pspark;
	void *kernbuf;
	size_t copylen;
	int error;

	PUFFS_VNREQ(fcnioctl);

	/*
	 * Since this op gives the filesystem (almost) complete control on
	 * how much it is allowed to copy from the calling process
	 * address space, do not enable it by default, since it would
	 * be a whopping security hole.
	 */
	pmp = MPTOPUFFSMP(ap->a_vp->v_mount);
	if ((pmp->pmp_flags & PUFFS_KFLAG_ALLOWCTL) == 0)
		return EINVAL; /* only shoe that fits */

	/* fill in sizereq and store it */
	pspark.pkso_reqid = puffs_getreqid(pmp);
	pspark.pkso_reqtype = PUFFS_SIZEOPREQ_BUF_IN;
	pspark.pkso_copybuf = ap->a_data;
	pspark.pkso_bufsize = FCNIOCTL_ARG_MAX;
	TAILQ_INSERT_TAIL(&pmp->pmp_req_sizepark, &pspark, pkso_entries);

	/* then fill in actual request and shoot it off */
	fcnioctl_arg.pvnr_command = ap->a_command;
	fcnioctl_arg.pvnr_fflag = ap->a_fflag;
	puffs_credcvt(&fcnioctl_arg.pvnr_cred, ap->a_cred);
	fcnioctl_arg.pvnr_pid = puffs_lwp2pid(ap->a_l);

	error = puffs_vntouser_req(MPTOPUFFSMP(ap->a_vp->v_mount), puffsop,
	    &fcnioctl_arg, sizeof(fcnioctl_arg), 0, ap->a_vp,
	    pspark.pkso_reqid, ap->a_vp, NULL);

	/* if we don't need to copy data, we're done */
	if (error || !fcnioctl_arg.pvnr_copyback)
		return error;

	copylen = MIN(FCNIOCTL_ARG_MAX, fcnioctl_arg.pvnr_datalen);
	kernbuf = malloc(copylen, M_PUFFS, M_WAITOK);
	error = copyin(fcnioctl_arg.pvnr_data, kernbuf, copylen);
	if (error)
		goto out;
	error = copyout(kernbuf, ap->a_data, copylen);

 out:
	free(kernbuf, M_PUFFS);
	return error;
#endif
}
1783
1784 int
1785 puffs_ioctl(void *v)
1786 {
1787
1788 return puffs_fcnioctl(v, PUFFS_VN_IOCTL);
1789 }
1790
1791 int
1792 puffs_fcntl(void *v)
1793 {
1794
1795 return puffs_fcnioctl(v, PUFFS_VN_FCNTL);
1796 }
1797
1798 int
1799 puffs_print(void *v)
1800 {
1801 struct vop_print_args /* {
1802 struct vnode *a_vp;
1803 } */ *ap = v;
1804 struct puffs_mount *pmp;
1805 struct vnode *vp = ap->a_vp;
1806 struct puffs_node *pn = vp->v_data;
1807
1808 PUFFS_VNREQ(print);
1809
1810 pmp = MPTOPUFFSMP(vp->v_mount);
1811
1812 /* kernel portion */
1813 printf("tag VT_PUFFS, vnode %p, puffs node: %p,\n"
1814 " userspace cookie: %p\n", vp, pn, pn->pn_cookie);
1815 if (vp->v_type == VFIFO)
1816 fifo_printinfo(vp);
1817 lockmgr_printinfo(&vp->v_lock);
1818
1819 /* userspace portion */
1820 if (EXISTSOP(pmp, PRINT))
1821 puffs_vntouser(pmp, PUFFS_VN_PRINT,
1822 &print_arg, sizeof(print_arg), 0, ap->a_vp, NULL);
1823
1824 return 0;
1825 }
1826
1827 int
1828 puffs_pathconf(void *v)
1829 {
1830 struct vop_pathconf_args /* {
1831 const struct vnodeop_desc *a_desc;
1832 struct vnode *a_vp;
1833 int a_name;
1834 register_t *a_retval;
1835 } */ *ap = v;
1836 int error;
1837
1838 PUFFS_VNREQ(pathconf);
1839
1840 pathconf_arg.pvnr_name = ap->a_name;
1841
1842 error = puffs_vntouser(MPTOPUFFSMP(ap->a_vp->v_mount),
1843 PUFFS_VN_PATHCONF, &pathconf_arg, sizeof(pathconf_arg), 0,
1844 ap->a_vp, NULL);
1845 if (error)
1846 return error;
1847
1848 *ap->a_retval = pathconf_arg.pvnr_retval;
1849
1850 return 0;
1851 }
1852
1853 int
1854 puffs_advlock(void *v)
1855 {
1856 struct vop_advlock_args /* {
1857 const struct vnodeop_desc *a_desc;
1858 struct vnode *a_vp;
1859 void *a_id;
1860 int a_op;
1861 struct flock *a_fl;
1862 int a_flags;
1863 } */ *ap = v;
1864 int error;
1865
1866 PUFFS_VNREQ(advlock);
1867
1868 error = copyin(ap->a_fl, &advlock_arg.pvnr_fl, sizeof(struct flock));
1869 if (error)
1870 return error;
1871 advlock_arg.pvnr_id = ap->a_id;
1872 advlock_arg.pvnr_op = ap->a_op;
1873 advlock_arg.pvnr_flags = ap->a_flags;
1874
1875 return puffs_vntouser(MPTOPUFFSMP(ap->a_vp->v_mount), PUFFS_VN_ADVLOCK,
1876 &advlock_arg, sizeof(advlock_arg), 0, ap->a_vp, NULL);
1877 }
1878
/*
 * Classify a struct buf by its b_flags.  The argument is parenthesized
 * so that any pointer expression, e.g. "bp + 1", expands correctly.
 */
#define BIOASYNC(bp) ((bp)->b_flags & B_ASYNC)
#define BIOREAD(bp) ((bp)->b_flags & B_READ)
#define BIOWRITE(bp) (((bp)->b_flags & B_READ) == 0)
1882
1883 /*
1884 * This maps itself to PUFFS_VN_READ/WRITE for data transfer.
1885 */
1886 int
1887 puffs_strategy(void *v)
1888 {
1889 struct vop_strategy_args /* {
1890 const struct vnodeop_desc *a_desc;
1891 struct vnode *a_vp;
1892 struct buf *a_bp;
1893 } */ *ap = v;
1894 struct puffs_mount *pmp;
1895 struct vnode *vp = ap->a_vp;
1896 struct puffs_node *pn;
1897 struct puffs_vnreq_readwrite *rw_argp = NULL;
1898 struct buf *bp;
1899 size_t argsize;
1900 size_t tomove, moved;
1901 int error, dofaf;
1902
1903 pmp = MPTOPUFFSMP(vp->v_mount);
1904 bp = ap->a_bp;
1905 error = 0;
1906 dofaf = 0;
1907 pn = VPTOPP(vp);
1908
1909 if ((BIOREAD(bp) && !EXISTSOP(pmp, READ))
1910 || (BIOWRITE(bp) && !EXISTSOP(pmp, WRITE)))
1911 ERROUT(EOPNOTSUPP);
1912
1913 /*
1914 * Short-circuit optimization: don't flush buffer in between
1915 * VOP_INACTIVE and VOP_RECLAIM in case the node has no references.
1916 */
1917 if (pn->pn_stat & PNODE_DYING) {
1918 KASSERT(BIOWRITE(bp));
1919 bp->b_resid = 0;
1920 goto out;
1921 }
1922
1923 #ifdef DIAGNOSTIC
1924 if (bp->b_bcount > pmp->pmp_req_maxsize - PUFFS_REQSTRUCT_MAX)
1925 panic("puffs_strategy: wildly inappropriate buf bcount %d",
1926 bp->b_bcount);
1927 #endif
1928
1929 /*
1930 * See explanation for the necessity of a FAF in puffs_fsync.
1931 *
1932 * Also, do FAF in case we're suspending.
1933 * See puffs_vfsops.c:pageflush()
1934 */
1935 if (BIOWRITE(bp)) {
1936 simple_lock(&vp->v_interlock);
1937 if (vp->v_flag & VXLOCK)
1938 dofaf = 1;
1939 if (pn->pn_stat & PNODE_SUSPEND)
1940 dofaf = 1;
1941 simple_unlock(&vp->v_interlock);
1942 }
1943
1944 if (BIOASYNC(bp))
1945 dofaf = 1;
1946
1947 #ifdef DIAGNOSTIC
1948 if (curproc == uvm.pagedaemon_proc)
1949 KASSERT(dofaf);
1950 #endif
1951
1952 /* allocate transport structure */
1953 tomove = PUFFS_TOMOVE(bp->b_bcount, pmp);
1954 argsize = sizeof(struct puffs_vnreq_readwrite);
1955 rw_argp = malloc(argsize + tomove, M_PUFFS,
1956 M_ZERO | (dofaf ? M_NOWAIT : M_WAITOK));
1957 if (rw_argp == NULL)
1958 ERROUT(ENOMEM);
1959 RWARGS(rw_argp, 0, tomove, bp->b_blkno << DEV_BSHIFT, FSCRED);
1960
1961 /* 2x2 cases: read/write, faf/nofaf */
1962 if (BIOREAD(bp)) {
1963 if (dofaf) {
1964 puffs_vntouser_call(pmp, PUFFS_VN_READ, rw_argp,
1965 argsize, tomove, puffs_parkdone_asyncbioread,
1966 bp, vp, NULL);
1967 } else {
1968 error = puffs_vntouser(pmp, PUFFS_VN_READ,
1969 rw_argp, argsize, tomove, vp, NULL);
1970 if (error)
1971 goto out;
1972
1973 if (rw_argp->pvnr_resid > tomove)
1974 ERROUT(EINVAL);
1975
1976 moved = tomove - rw_argp->pvnr_resid;
1977
1978 (void)memcpy(bp->b_data, rw_argp->pvnr_data, moved);
1979 bp->b_resid = bp->b_bcount - moved;
1980 }
1981 } else {
1982 /*
1983 * make pages read-only before we write them if we want
1984 * write caching info
1985 */
1986 if (PUFFS_WCACHEINFO(pmp)) {
1987 struct uvm_object *uobj = &vp->v_uobj;
1988 int npages = (bp->b_bcount + PAGE_SIZE-1) >> PAGE_SHIFT;
1989 struct vm_page *vmp;
1990 int i;
1991
1992 for (i = 0; i < npages; i++) {
1993 vmp= uvm_pageratop((vaddr_t)bp->b_data
1994 + (i << PAGE_SHIFT));
1995 DPRINTF(("puffs_strategy: write-protecting "
1996 "vp %p page %p, offset %" PRId64"\n",
1997 vp, vmp, vmp->offset));
1998 simple_lock(&uobj->vmobjlock);
1999 vmp->flags |= PG_RDONLY;
2000 pmap_page_protect(vmp, VM_PROT_READ);
2001 simple_unlock(&uobj->vmobjlock);
2002 }
2003 }
2004
2005 (void)memcpy(&rw_argp->pvnr_data, bp->b_data, tomove);
2006 if (dofaf) {
2007 /*
2008 * assume FAF moves everything. frankly, we don't
2009 * really have a choice.
2010 */
2011 puffs_vntouser_faf(MPTOPUFFSMP(vp->v_mount),
2012 PUFFS_VN_WRITE, rw_argp, argsize + tomove, vp);
2013 bp->b_resid = bp->b_bcount - tomove;
2014 } else {
2015 error = puffs_vntouser(MPTOPUFFSMP(vp->v_mount),
2016 PUFFS_VN_WRITE, rw_argp, argsize + tomove,
2017 0, vp, NULL);
2018 if (error)
2019 goto out;
2020
2021 moved = tomove - rw_argp->pvnr_resid;
2022 if (rw_argp->pvnr_resid > tomove)
2023 ERROUT(EINVAL);
2024
2025 bp->b_resid = bp->b_bcount - moved;
2026 if (rw_argp->pvnr_resid != 0)
2027 ERROUT(EIO);
2028 }
2029 }
2030
2031 out:
2032 KASSERT(dofaf == 0 || error == 0 || rw_argp == NULL);
2033 if (rw_argp && !dofaf)
2034 free(rw_argp, M_PUFFS);
2035
2036 if (error) {
2037 bp->b_error = error;
2038 bp->b_flags |= B_ERROR;
2039 }
2040
2041 if (error || !(BIOREAD(bp) && BIOASYNC(bp)))
2042 biodone(bp);
2043
2044 return error;
2045 }
2046
2047 int
2048 puffs_mmap(void *v)
2049 {
2050 struct vop_mmap_args /* {
2051 const struct vnodeop_desc *a_desc;
2052 struct vnode *a_vp;
2053 int a_fflags;
2054 kauth_cred_t a_cred;
2055 struct lwp *a_l;
2056 } */ *ap = v;
2057 struct puffs_mount *pmp;
2058 int error;
2059
2060 PUFFS_VNREQ(mmap);
2061
2062 pmp = MPTOPUFFSMP(ap->a_vp->v_mount);
2063
2064 if (!PUFFS_USE_PAGECACHE(pmp))
2065 return genfs_eopnotsupp(v);
2066
2067 if (EXISTSOP(pmp, MMAP)) {
2068 mmap_arg.pvnr_fflags = ap->a_fflags;
2069 puffs_credcvt(&mmap_arg.pvnr_cred, ap->a_cred);
2070 puffs_cidcvt(&mmap_arg.pvnr_cid, ap->a_l);
2071
2072 error = puffs_vntouser(pmp, PUFFS_VN_MMAP,
2073 &mmap_arg, sizeof(mmap_arg), 0,
2074 ap->a_vp, NULL);
2075 } else {
2076 error = genfs_mmap(v);
2077 }
2078
2079 return error;
2080 }
2081
2082
2083 /*
2084 * The rest don't get a free trip to userspace and back, they
2085 * have to stay within the kernel.
2086 */
2087
2088 /*
2089 * bmap doesn't really make any sense for puffs, so just 1:1 map it.
2090 * well, maybe somehow, somewhere, some day ....
2091 */
2092 int
2093 puffs_bmap(void *v)
2094 {
2095 struct vop_bmap_args /* {
2096 const struct vnodeop_desc *a_desc;
2097 struct vnode *a_vp;
2098 daddr_t a_bn;
2099 struct vnode **a_vpp;
2100 daddr_t *a_bnp;
2101 int *a_runp;
2102 } */ *ap = v;
2103 struct puffs_mount *pmp;
2104
2105 pmp = MPTOPUFFSMP(ap->a_vp->v_mount);
2106
2107 if (ap->a_vpp)
2108 *ap->a_vpp = ap->a_vp;
2109 if (ap->a_bnp)
2110 *ap->a_bnp = ap->a_bn;
2111 if (ap->a_runp)
2112 *ap->a_runp
2113 = (PUFFS_TOMOVE(pmp->pmp_req_maxsize, pmp)>>DEV_BSHIFT) - 1;
2114
2115 return 0;
2116 }
2117
2118 /*
2119 * Handle getpages faults in puffs. We let genfs_getpages() do most
2120 * of the dirty work, but we come in this route to do accounting tasks.
2121 * If the user server has specified functions for cache notifications
2122 * about reads and/or writes, we record which type of operation we got,
2123 * for which page range, and proceed to issue a FAF notification to the
2124 * server about it.
2125 */
2126 int
2127 puffs_getpages(void *v)
2128 {
2129 struct vop_getpages_args /* {
2130 const struct vnodeop_desc *a_desc;
2131 struct vnode *a_vp;
2132 voff_t a_offset;
2133 struct vm_page **a_m;
2134 int *a_count;
2135 int a_centeridx;
2136 vm_prot_t a_access_type;
2137 int a_advice;
2138 int a_flags;
2139 } */ *ap = v;
2140 struct puffs_mount *pmp;
2141 struct vnode *vp;
2142 struct vm_page **pgs;
2143 struct puffs_cacheinfo *pcinfo = NULL;
2144 struct puffs_cacherun *pcrun;
2145 void *parkmem = NULL;
2146 size_t runsizes;
2147 int i, npages, si, streakon;
2148 int error, locked, write;
2149
2150 pmp = MPTOPUFFSMP(ap->a_vp->v_mount);
2151 npages = *ap->a_count;
2152 pgs = ap->a_m;
2153 vp = ap->a_vp;
2154 locked = (ap->a_flags & PGO_LOCKED) != 0;
2155 write = (ap->a_access_type & VM_PROT_WRITE) != 0;
2156
2157 /* ccg xnaht - gets Wuninitialized wrong */
2158 pcrun = NULL;
2159 runsizes = 0;
2160
2161 if (write && PUFFS_WCACHEINFO(pmp)) {
2162 /* allocate worst-case memory */
2163 runsizes = ((npages / 2) + 1) * sizeof(struct puffs_cacherun);
2164 pcinfo = malloc(sizeof(struct puffs_cacheinfo) + runsizes,
2165 M_PUFFS, M_ZERO | locked ? M_NOWAIT : M_WAITOK);
2166
2167 /*
2168 * can't block if we're locked and can't mess up caching
2169 * information for fs server. so come back later, please
2170 */
2171 if (pcinfo == NULL)
2172 ERROUT(ENOMEM);
2173
2174 parkmem = puffs_park_alloc(locked == 0);
2175 if (parkmem == NULL)
2176 ERROUT(ENOMEM);
2177
2178 pcrun = pcinfo->pcache_runs;
2179 }
2180
2181 error = genfs_getpages(v);
2182 if (error)
2183 goto out;
2184
2185 if (PUFFS_WCACHEINFO(pmp) == 0)
2186 goto out;
2187
2188 /*
2189 * Let's see whose fault it was and inform the user server of
2190 * possibly read/written pages. Map pages from read faults
2191 * strictly read-only, since otherwise we might miss info on
2192 * when the page is actually write-faulted to.
2193 */
2194 if (!locked)
2195 simple_lock(&vp->v_uobj.vmobjlock);
2196 for (i = 0, si = 0, streakon = 0; i < npages; i++) {
2197 if (pgs[i] == NULL || pgs[i] == PGO_DONTCARE) {
2198 if (streakon && write) {
2199 streakon = 0;
2200 pcrun[si].pcache_runend
2201 = trunc_page(pgs[i]->offset) + PAGE_MASK;
2202 si++;
2203 }
2204 continue;
2205 }
2206 if (streakon == 0 && write) {
2207 streakon = 1;
2208 pcrun[si].pcache_runstart = pgs[i]->offset;
2209 }
2210
2211 if (!write)
2212 pgs[i]->flags |= PG_RDONLY;
2213 }
2214 /* was the last page part of our streak? */
2215 if (streakon) {
2216 pcrun[si].pcache_runend
2217 = trunc_page(pgs[i-1]->offset) + PAGE_MASK;
2218 si++;
2219 }
2220 if (!locked)
2221 simple_unlock(&vp->v_uobj.vmobjlock);
2222
2223 KASSERT(si <= (npages / 2) + 1);
2224
2225 /* send results to userspace */
2226 if (write)
2227 puffs_cacheop(pmp, parkmem, pcinfo,
2228 sizeof(struct puffs_cacheinfo) + runsizes, VPTOPNC(vp));
2229
2230 out:
2231 if (error) {
2232 if (pcinfo != NULL)
2233 free(pcinfo, M_PUFFS);
2234 if (parkmem != NULL)
2235 puffs_park_release(parkmem, 1);
2236 }
2237
2238 return error;
2239 }
2240
2241 int
2242 puffs_lock(void *v)
2243 {
2244 struct vop_lock_args /* {
2245 struct vnode *a_vp;
2246 int a_flags;
2247 }*/ *ap = v;
2248 struct vnode *vp = ap->a_vp;
2249 struct mount *mp = vp->v_mount;
2250
2251 #if 0
2252 DPRINTF(("puffs_lock: lock %p, args 0x%x\n", vp, ap->a_flags));
2253 #endif
2254
2255 /*
2256 * XXX: this avoids deadlocking when we're suspending.
2257 * e.g. some ops holding the vnode lock might be blocked for
2258 * the vfs transaction lock so we'd deadlock.
2259 *
2260 * Now once again this is skating on the thin ice of modern life,
2261 * since we are breaking the consistency guarantee provided
2262 * _to the user server_ by vnode locking. Hopefully this will
2263 * get fixed soon enough by getting rid of the dependency on
2264 * vnode locks alltogether.
2265 */
2266 if (fstrans_is_owner(mp) && fstrans_getstate(mp) == FSTRANS_SUSPENDING){
2267 if (ap->a_flags & LK_INTERLOCK)
2268 simple_unlock(&vp->v_interlock);
2269 return 0;
2270 }
2271
2272 return lockmgr(&vp->v_lock, ap->a_flags, &vp->v_interlock);
2273 }
2274
2275 int
2276 puffs_unlock(void *v)
2277 {
2278 struct vop_unlock_args /* {
2279 struct vnode *a_vp;
2280 int a_flags;
2281 } */ *ap = v;
2282 struct vnode *vp = ap->a_vp;
2283 struct mount *mp = vp->v_mount;
2284
2285 #if 0
2286 DPRINTF(("puffs_unlock: lock %p, args 0x%x\n", vp, ap->a_flags));
2287 #endif
2288
2289 /* XXX: see puffs_lock() */
2290 if (fstrans_is_owner(mp) && fstrans_getstate(mp) == FSTRANS_SUSPENDING){
2291 if (ap->a_flags & LK_INTERLOCK)
2292 simple_unlock(&vp->v_interlock);
2293 return 0;
2294 }
2295
2296 return lockmgr(&vp->v_lock, ap->a_flags | LK_RELEASE, &vp->v_interlock);
2297 }
2298
2299 int
2300 puffs_islocked(void *v)
2301 {
2302 struct vop_islocked_args *ap = v;
2303 int rv;
2304
2305 rv = lockstatus(&ap->a_vp->v_lock);
2306 return rv;
2307 }
2308
2309 int
2310 puffs_generic(void *v)
2311 {
2312 struct vop_generic_args *ap = v;
2313
2314 (void)ap;
2315 DPRINTF(("puffs_generic: ap->a_desc = %s\n", ap->a_desc->vdesc_name));
2316
2317 return EOPNOTSUPP;
2318 }
2319
2320
2321 /*
2322 * spec & fifo. These call the miscfs spec and fifo vectors, but issue
2323 * FAF update information for the puffs node first.
2324 */
2325 int
2326 puffs_spec_read(void *v)
2327 {
2328 struct vop_read_args /* {
2329 const struct vnodeop_desc *a_desc;
2330 struct vnode *a_vp;
2331 struct uio *a_uio;
2332 int a_ioflag;
2333 kauth_cred_t a_cred;
2334 } */ *ap = v;
2335
2336 puffs_updatenode(ap->a_vp, PUFFS_UPDATEATIME);
2337 return VOCALL(spec_vnodeop_p, VOFFSET(vop_read), v);
2338 }
2339
2340 int
2341 puffs_spec_write(void *v)
2342 {
2343 struct vop_write_args /* {
2344 const struct vnodeop_desc *a_desc;
2345 struct vnode *a_vp;
2346 struct uio *a_uio;
2347 int a_ioflag;
2348 kauth_cred_t a_cred;
2349 }*/ *ap = v;
2350
2351 puffs_updatenode(ap->a_vp, PUFFS_UPDATEMTIME);
2352 return VOCALL(spec_vnodeop_p, VOFFSET(vop_write), v);
2353 }
2354
2355 int
2356 puffs_fifo_read(void *v)
2357 {
2358 struct vop_read_args /* {
2359 const struct vnodeop_desc *a_desc;
2360 struct vnode *a_vp;
2361 struct uio *a_uio;
2362 int a_ioflag;
2363 kauth_cred_t a_cred;
2364 } */ *ap = v;
2365
2366 puffs_updatenode(ap->a_vp, PUFFS_UPDATEATIME);
2367 return VOCALL(fifo_vnodeop_p, VOFFSET(vop_read), v);
2368 }
2369
2370 int
2371 puffs_fifo_write(void *v)
2372 {
2373 struct vop_write_args /* {
2374 const struct vnodeop_desc *a_desc;
2375 struct vnode *a_vp;
2376 struct uio *a_uio;
2377 int a_ioflag;
2378 kauth_cred_t a_cred;
2379 }*/ *ap = v;
2380
2381 puffs_updatenode(ap->a_vp, PUFFS_UPDATEMTIME);
2382 return VOCALL(fifo_vnodeop_p, VOFFSET(vop_write), v);
2383 }
2384