/*	$NetBSD: tmpfs_vnops.c,v 1.120.2.2 2016/05/09 19:45:00 snj Exp $	*/
2
3 /*
4 * Copyright (c) 2005, 2006, 2007 The NetBSD Foundation, Inc.
5 * All rights reserved.
6 *
7 * This code is derived from software contributed to The NetBSD Foundation
8 * by Julio M. Merino Vidal, developed as part of Google's Summer of Code
9 * 2005 program.
10 *
11 * Redistribution and use in source and binary forms, with or without
12 * modification, are permitted provided that the following conditions
13 * are met:
14 * 1. Redistributions of source code must retain the above copyright
15 * notice, this list of conditions and the following disclaimer.
16 * 2. Redistributions in binary form must reproduce the above copyright
17 * notice, this list of conditions and the following disclaimer in the
18 * documentation and/or other materials provided with the distribution.
19 *
20 * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
21 * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
22 * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
23 * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
24 * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
25 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
26 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
27 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
28 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
29 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
30 * POSSIBILITY OF SUCH DAMAGE.
31 */
32
33 /*
34 * tmpfs vnode interface.
35 */
36
37 #include <sys/cdefs.h>
38 __KERNEL_RCSID(0, "$NetBSD: tmpfs_vnops.c,v 1.120.2.2 2016/05/09 19:45:00 snj Exp $");
39
40 #include <sys/param.h>
41 #include <sys/dirent.h>
42 #include <sys/fcntl.h>
43 #include <sys/event.h>
44 #include <sys/malloc.h>
45 #include <sys/namei.h>
46 #include <sys/stat.h>
47 #include <sys/uio.h>
48 #include <sys/unistd.h>
49 #include <sys/vnode.h>
50 #include <sys/lockf.h>
51 #include <sys/kauth.h>
52 #include <sys/atomic.h>
53
54 #include <uvm/uvm.h>
55
56 #include <miscfs/fifofs/fifo.h>
57 #include <miscfs/genfs/genfs.h>
58 #include <fs/tmpfs/tmpfs_vnops.h>
59 #include <fs/tmpfs/tmpfs.h>
60
61 /*
62 * vnode operations vector used for files stored in a tmpfs file system.
63 */
64 int (**tmpfs_vnodeop_p)(void *);
65 const struct vnodeopv_entry_desc tmpfs_vnodeop_entries[] = {
66 { &vop_default_desc, vn_default_error },
67 { &vop_lookup_desc, tmpfs_lookup },
68 { &vop_create_desc, tmpfs_create },
69 { &vop_mknod_desc, tmpfs_mknod },
70 { &vop_open_desc, tmpfs_open },
71 { &vop_close_desc, tmpfs_close },
72 { &vop_access_desc, tmpfs_access },
73 { &vop_getattr_desc, tmpfs_getattr },
74 { &vop_setattr_desc, tmpfs_setattr },
75 { &vop_read_desc, tmpfs_read },
76 { &vop_write_desc, tmpfs_write },
77 { &vop_fallocate_desc, genfs_eopnotsupp },
78 { &vop_fdiscard_desc, genfs_eopnotsupp },
79 { &vop_ioctl_desc, tmpfs_ioctl },
80 { &vop_fcntl_desc, tmpfs_fcntl },
81 { &vop_poll_desc, tmpfs_poll },
82 { &vop_kqfilter_desc, tmpfs_kqfilter },
83 { &vop_revoke_desc, tmpfs_revoke },
84 { &vop_mmap_desc, tmpfs_mmap },
85 { &vop_fsync_desc, tmpfs_fsync },
86 { &vop_seek_desc, tmpfs_seek },
87 { &vop_remove_desc, tmpfs_remove },
88 { &vop_link_desc, tmpfs_link },
89 { &vop_rename_desc, tmpfs_rename },
90 { &vop_mkdir_desc, tmpfs_mkdir },
91 { &vop_rmdir_desc, tmpfs_rmdir },
92 { &vop_symlink_desc, tmpfs_symlink },
93 { &vop_readdir_desc, tmpfs_readdir },
94 { &vop_readlink_desc, tmpfs_readlink },
95 { &vop_abortop_desc, tmpfs_abortop },
96 { &vop_inactive_desc, tmpfs_inactive },
97 { &vop_reclaim_desc, tmpfs_reclaim },
98 { &vop_lock_desc, tmpfs_lock },
99 { &vop_unlock_desc, tmpfs_unlock },
100 { &vop_bmap_desc, tmpfs_bmap },
101 { &vop_strategy_desc, tmpfs_strategy },
102 { &vop_print_desc, tmpfs_print },
103 { &vop_pathconf_desc, tmpfs_pathconf },
104 { &vop_islocked_desc, tmpfs_islocked },
105 { &vop_advlock_desc, tmpfs_advlock },
106 { &vop_bwrite_desc, tmpfs_bwrite },
107 { &vop_getpages_desc, tmpfs_getpages },
108 { &vop_putpages_desc, tmpfs_putpages },
109 { &vop_whiteout_desc, tmpfs_whiteout },
110 { NULL, NULL }
111 };
112
113 const struct vnodeopv_desc tmpfs_vnodeop_opv_desc = {
114 &tmpfs_vnodeop_p, tmpfs_vnodeop_entries
115 };
116
117 /*
118 * tmpfs_lookup: path name traversal routine.
119 *
120 * Arguments: dvp (directory being searched), vpp (result),
121 * cnp (component name - path).
122 *
123 * => Caller holds a reference and lock on dvp.
124 * => We return looked-up vnode (vpp) locked, with a reference held.
125 */
126 int
127 tmpfs_lookup(void *v)
128 {
129 struct vop_lookup_v2_args /* {
130 struct vnode *a_dvp;
131 struct vnode **a_vpp;
132 struct componentname *a_cnp;
133 } */ *ap = v;
134 vnode_t *dvp = ap->a_dvp, **vpp = ap->a_vpp;
135 struct componentname *cnp = ap->a_cnp;
136 const bool lastcn = (cnp->cn_flags & ISLASTCN) != 0;
137 tmpfs_node_t *dnode, *tnode;
138 tmpfs_dirent_t *de;
139 int cachefound, iswhiteout;
140 int error;
141
142 KASSERT(VOP_ISLOCKED(dvp));
143
144 dnode = VP_TO_TMPFS_DIR(dvp);
145 *vpp = NULL;
146
147 /* Check accessibility of directory. */
148 error = VOP_ACCESS(dvp, VEXEC, cnp->cn_cred);
149 if (error) {
150 goto out;
151 }
152
153 /*
154 * If requesting the last path component on a read-only file system
155 * with a write operation, deny it.
156 */
157 if (lastcn && (dvp->v_mount->mnt_flag & MNT_RDONLY) != 0 &&
158 (cnp->cn_nameiop == DELETE || cnp->cn_nameiop == RENAME)) {
159 error = EROFS;
160 goto out;
161 }
162
163 /*
164 * Avoid doing a linear scan of the directory if the requested
165 * directory/name couple is already in the cache.
166 */
167 cachefound = cache_lookup(dvp, cnp->cn_nameptr, cnp->cn_namelen,
168 cnp->cn_nameiop, cnp->cn_flags,
169 &iswhiteout, vpp);
170 if (iswhiteout) {
171 cnp->cn_flags |= ISWHITEOUT;
172 }
173 if (cachefound && *vpp == NULLVP) {
174 /* Negative cache hit. */
175 error = ENOENT;
176 goto out_unlocked;
177 } else if (cachefound) {
178 error = 0;
179 goto out_unlocked;
180 }
181
182 /*
183 * Treat an unlinked directory as empty (no "." or "..")
184 */
185 if (dnode->tn_links == 0) {
186 KASSERT(dnode->tn_size == 0);
187 error = ENOENT;
188 goto out;
189 }
190
191 if (cnp->cn_flags & ISDOTDOT) {
192 tmpfs_node_t *pnode;
193
194 /*
195 * Lookup of ".." case.
196 */
197 if (lastcn && cnp->cn_nameiop == RENAME) {
198 error = EINVAL;
199 goto out;
200 }
201 KASSERT(dnode->tn_type == VDIR);
202 pnode = dnode->tn_spec.tn_dir.tn_parent;
203 if (pnode == NULL) {
204 error = ENOENT;
205 goto out;
206 }
207
208 /*
209 * Lock the parent tn_vlock before releasing the vnode lock,
210 * and thus prevent parent from disappearing.
211 */
212 mutex_enter(&pnode->tn_vlock);
213 VOP_UNLOCK(dvp);
214
215 /*
216 * Get a vnode of the '..' entry and re-acquire the lock.
217 * Release the tn_vlock.
218 */
219 error = tmpfs_vnode_get(dvp->v_mount, pnode, vpp);
220 vn_lock(dvp, LK_EXCLUSIVE | LK_RETRY);
221 goto out;
222
223 } else if (cnp->cn_namelen == 1 && cnp->cn_nameptr[0] == '.') {
224 /*
225 * Lookup of "." case.
226 */
227 if (lastcn && cnp->cn_nameiop == RENAME) {
228 error = EISDIR;
229 goto out;
230 }
231 vref(dvp);
232 *vpp = dvp;
233 error = 0;
234 goto done;
235 }
236
237 /*
238 * Other lookup cases: perform directory scan.
239 */
240 de = tmpfs_dir_lookup(dnode, cnp);
241 if (de == NULL || de->td_node == TMPFS_NODE_WHITEOUT) {
242 /*
243 * The entry was not found in the directory. This is valid
244 * if we are creating or renaming an entry and are working
245 * on the last component of the path name.
246 */
247 if (lastcn && (cnp->cn_nameiop == CREATE ||
248 cnp->cn_nameiop == RENAME)) {
249 error = VOP_ACCESS(dvp, VWRITE, cnp->cn_cred);
250 if (error) {
251 goto out;
252 }
253 error = EJUSTRETURN;
254 } else {
255 error = ENOENT;
256 }
257 if (de) {
258 KASSERT(de->td_node == TMPFS_NODE_WHITEOUT);
259 cnp->cn_flags |= ISWHITEOUT;
260 }
261 goto done;
262 }
263
264 tnode = de->td_node;
265
266 /*
267 * If it is not the last path component and found a non-directory
268 * or non-link entry (which may itself be pointing to a directory),
269 * raise an error.
270 */
271 if (!lastcn && tnode->tn_type != VDIR && tnode->tn_type != VLNK) {
272 error = ENOTDIR;
273 goto out;
274 }
275
276 /* Check the permissions. */
277 if (lastcn && (cnp->cn_nameiop == DELETE || cnp->cn_nameiop == RENAME)) {
278 error = VOP_ACCESS(dvp, VWRITE, cnp->cn_cred);
279 if (error)
280 goto out;
281
282 if ((dnode->tn_mode & S_ISTXT) != 0) {
283 error = kauth_authorize_vnode(cnp->cn_cred,
284 KAUTH_VNODE_DELETE, tnode->tn_vnode,
285 dnode->tn_vnode, genfs_can_sticky(cnp->cn_cred,
286 dnode->tn_uid, tnode->tn_uid));
287 if (error) {
288 error = EPERM;
289 goto out;
290 }
291 }
292 }
293
294 /* Get a vnode for the matching entry. */
295 mutex_enter(&tnode->tn_vlock);
296 error = tmpfs_vnode_get(dvp->v_mount, tnode, vpp);
297 done:
298 /*
299 * Cache the result, unless request was for creation (as it does
300 * not improve the performance).
301 */
302 if (cnp->cn_nameiop != CREATE) {
303 cache_enter(dvp, *vpp, cnp->cn_nameptr, cnp->cn_namelen,
304 cnp->cn_flags);
305 }
306 out:
307 if (error == 0 && *vpp != dvp)
308 VOP_UNLOCK(*vpp);
309 out_unlocked:
310 KASSERT(VOP_ISLOCKED(dvp));
311
312 return error;
313 }
314
315 int
316 tmpfs_create(void *v)
317 {
318 struct vop_create_v3_args /* {
319 struct vnode *a_dvp;
320 struct vnode **a_vpp;
321 struct componentname *a_cnp;
322 struct vattr *a_vap;
323 } */ *ap = v;
324 vnode_t *dvp = ap->a_dvp, **vpp = ap->a_vpp;
325 struct componentname *cnp = ap->a_cnp;
326 struct vattr *vap = ap->a_vap;
327
328 KASSERT(VOP_ISLOCKED(dvp));
329 KASSERT(vap->va_type == VREG || vap->va_type == VSOCK);
330 return tmpfs_construct_node(dvp, vpp, vap, cnp, NULL);
331 }
332
333 int
334 tmpfs_mknod(void *v)
335 {
336 struct vop_mknod_v3_args /* {
337 struct vnode *a_dvp;
338 struct vnode **a_vpp;
339 struct componentname *a_cnp;
340 struct vattr *a_vap;
341 } */ *ap = v;
342 vnode_t *dvp = ap->a_dvp, **vpp = ap->a_vpp;
343 struct componentname *cnp = ap->a_cnp;
344 struct vattr *vap = ap->a_vap;
345 enum vtype vt = vap->va_type;
346
347 if (vt != VBLK && vt != VCHR && vt != VFIFO) {
348 *vpp = NULL;
349 return EINVAL;
350 }
351 return tmpfs_construct_node(dvp, vpp, vap, cnp, NULL);
352 }
353
354 int
355 tmpfs_open(void *v)
356 {
357 struct vop_open_args /* {
358 struct vnode *a_vp;
359 int a_mode;
360 kauth_cred_t a_cred;
361 } */ *ap = v;
362 vnode_t *vp = ap->a_vp;
363 mode_t mode = ap->a_mode;
364 tmpfs_node_t *node;
365
366 KASSERT(VOP_ISLOCKED(vp));
367
368 node = VP_TO_TMPFS_NODE(vp);
369
370 /* If the file is marked append-only, deny write requests. */
371 if ((node->tn_flags & APPEND) != 0 &&
372 (mode & (FWRITE | O_APPEND)) == FWRITE) {
373 return EPERM;
374 }
375 return 0;
376 }
377
378 int
379 tmpfs_close(void *v)
380 {
381 struct vop_close_args /* {
382 struct vnode *a_vp;
383 int a_fflag;
384 kauth_cred_t a_cred;
385 } */ *ap = v;
386 vnode_t *vp __diagused = ap->a_vp;
387
388 KASSERT(VOP_ISLOCKED(vp));
389 return 0;
390 }
391
392 int
393 tmpfs_access(void *v)
394 {
395 struct vop_access_args /* {
396 struct vnode *a_vp;
397 int a_mode;
398 kauth_cred_t a_cred;
399 } */ *ap = v;
400 vnode_t *vp = ap->a_vp;
401 mode_t mode = ap->a_mode;
402 kauth_cred_t cred = ap->a_cred;
403 tmpfs_node_t *node = VP_TO_TMPFS_NODE(vp);
404 const bool writing = (mode & VWRITE) != 0;
405
406 KASSERT(VOP_ISLOCKED(vp));
407
408 /* Possible? */
409 switch (vp->v_type) {
410 case VDIR:
411 case VLNK:
412 case VREG:
413 if (writing && (vp->v_mount->mnt_flag & MNT_RDONLY) != 0) {
414 return EROFS;
415 }
416 break;
417 case VBLK:
418 case VCHR:
419 case VSOCK:
420 case VFIFO:
421 break;
422 default:
423 return EINVAL;
424 }
425 if (writing && (node->tn_flags & IMMUTABLE) != 0) {
426 return EPERM;
427 }
428
429 return kauth_authorize_vnode(cred, KAUTH_ACCESS_ACTION(mode,
430 vp->v_type, node->tn_mode), vp, NULL, genfs_can_access(vp->v_type,
431 node->tn_mode, node->tn_uid, node->tn_gid, mode, cred));
432 }
433
434 int
435 tmpfs_getattr(void *v)
436 {
437 struct vop_getattr_args /* {
438 struct vnode *a_vp;
439 struct vattr *a_vap;
440 kauth_cred_t a_cred;
441 } */ *ap = v;
442 vnode_t *vp = ap->a_vp;
443 struct vattr *vap = ap->a_vap;
444 tmpfs_node_t *node = VP_TO_TMPFS_NODE(vp);
445
446 vattr_null(vap);
447
448 vap->va_type = vp->v_type;
449 vap->va_mode = node->tn_mode;
450 vap->va_nlink = node->tn_links;
451 vap->va_uid = node->tn_uid;
452 vap->va_gid = node->tn_gid;
453 vap->va_fsid = vp->v_mount->mnt_stat.f_fsidx.__fsid_val[0];
454 vap->va_fileid = node->tn_id;
455 vap->va_size = node->tn_size;
456 vap->va_blocksize = PAGE_SIZE;
457 vap->va_atime = node->tn_atime;
458 vap->va_mtime = node->tn_mtime;
459 vap->va_ctime = node->tn_ctime;
460 vap->va_birthtime = node->tn_birthtime;
461 vap->va_gen = TMPFS_NODE_GEN(node);
462 vap->va_flags = node->tn_flags;
463 vap->va_rdev = (vp->v_type == VBLK || vp->v_type == VCHR) ?
464 node->tn_spec.tn_dev.tn_rdev : VNOVAL;
465 vap->va_bytes = round_page(node->tn_size);
466 vap->va_filerev = VNOVAL;
467 vap->va_vaflags = 0;
468 vap->va_spare = VNOVAL; /* XXX */
469
470 return 0;
471 }
472
473 int
474 tmpfs_setattr(void *v)
475 {
476 struct vop_setattr_args /* {
477 struct vnode *a_vp;
478 struct vattr *a_vap;
479 kauth_cred_t a_cred;
480 } */ *ap = v;
481 vnode_t *vp = ap->a_vp;
482 struct vattr *vap = ap->a_vap;
483 kauth_cred_t cred = ap->a_cred;
484 lwp_t *l = curlwp;
485 int error = 0;
486
487 KASSERT(VOP_ISLOCKED(vp));
488
489 /* Abort if any unsettable attribute is given. */
490 if (vap->va_type != VNON || vap->va_nlink != VNOVAL ||
491 vap->va_fsid != VNOVAL || vap->va_fileid != VNOVAL ||
492 vap->va_blocksize != VNOVAL || vap->va_ctime.tv_sec != VNOVAL ||
493 vap->va_gen != VNOVAL || vap->va_rdev != VNOVAL ||
494 vap->va_bytes != VNOVAL) {
495 return EINVAL;
496 }
497
498 if (error == 0 && vap->va_flags != VNOVAL)
499 error = tmpfs_chflags(vp, vap->va_flags, cred, l);
500
501 if (error == 0 && vap->va_size != VNOVAL)
502 error = tmpfs_chsize(vp, vap->va_size, cred, l);
503
504 if (error == 0 && (vap->va_uid != VNOVAL || vap->va_gid != VNOVAL))
505 error = tmpfs_chown(vp, vap->va_uid, vap->va_gid, cred, l);
506
507 if (error == 0 && vap->va_mode != VNOVAL)
508 error = tmpfs_chmod(vp, vap->va_mode, cred, l);
509
510 const bool chsometime =
511 vap->va_atime.tv_sec != VNOVAL ||
512 vap->va_mtime.tv_sec != VNOVAL ||
513 vap->va_birthtime.tv_sec != VNOVAL;
514 if (error == 0 && chsometime) {
515 error = tmpfs_chtimes(vp, &vap->va_atime, &vap->va_mtime,
516 &vap->va_birthtime, vap->va_vaflags, cred, l);
517 }
518 return error;
519 }
520
521 int
522 tmpfs_read(void *v)
523 {
524 struct vop_read_args /* {
525 struct vnode *a_vp;
526 struct uio *a_uio;
527 int a_ioflag;
528 kauth_cred_t a_cred;
529 } */ *ap = v;
530 vnode_t *vp = ap->a_vp;
531 struct uio *uio = ap->a_uio;
532 const int ioflag = ap->a_ioflag;
533 tmpfs_node_t *node;
534 struct uvm_object *uobj;
535 int error;
536
537 KASSERT(VOP_ISLOCKED(vp));
538
539 if (vp->v_type == VDIR) {
540 return EISDIR;
541 }
542 if (uio->uio_offset < 0 || vp->v_type != VREG) {
543 return EINVAL;
544 }
545
546 /* Note: reading zero bytes should not update atime. */
547 if (uio->uio_resid == 0) {
548 return 0;
549 }
550
551 node = VP_TO_TMPFS_NODE(vp);
552 uobj = node->tn_spec.tn_reg.tn_aobj;
553 error = 0;
554
555 while (error == 0 && uio->uio_resid > 0) {
556 vsize_t len;
557
558 if (node->tn_size <= uio->uio_offset) {
559 break;
560 }
561 len = MIN(node->tn_size - uio->uio_offset, uio->uio_resid);
562 if (len == 0) {
563 break;
564 }
565 error = ubc_uiomove(uobj, uio, len, IO_ADV_DECODE(ioflag),
566 UBC_READ | UBC_PARTIALOK | UBC_UNMAP_FLAG(vp));
567 }
568
569 tmpfs_update(vp, TMPFS_UPDATE_ATIME);
570 return error;
571 }
572
573 int
574 tmpfs_write(void *v)
575 {
576 struct vop_write_args /* {
577 struct vnode *a_vp;
578 struct uio *a_uio;
579 int a_ioflag;
580 kauth_cred_t a_cred;
581 } */ *ap = v;
582 vnode_t *vp = ap->a_vp;
583 struct uio *uio = ap->a_uio;
584 const int ioflag = ap->a_ioflag;
585 tmpfs_node_t *node;
586 struct uvm_object *uobj;
587 off_t oldsize;
588 int error;
589
590 KASSERT(VOP_ISLOCKED(vp));
591
592 if ((vp->v_mount->mnt_flag & MNT_RDONLY) != 0) {
593 error = EROFS;
594 goto out;
595 }
596
597 node = VP_TO_TMPFS_NODE(vp);
598 oldsize = node->tn_size;
599
600 if (uio->uio_offset < 0 || vp->v_type != VREG) {
601 error = EINVAL;
602 goto out;
603 }
604 if (uio->uio_resid == 0) {
605 error = 0;
606 goto out;
607 }
608 if (ioflag & IO_APPEND) {
609 uio->uio_offset = node->tn_size;
610 }
611
612 if (uio->uio_offset + uio->uio_resid > node->tn_size) {
613 error = tmpfs_reg_resize(vp, uio->uio_offset + uio->uio_resid);
614 if (error)
615 goto out;
616 }
617
618 uobj = node->tn_spec.tn_reg.tn_aobj;
619 error = 0;
620 while (error == 0 && uio->uio_resid > 0) {
621 vsize_t len;
622
623 len = MIN(node->tn_size - uio->uio_offset, uio->uio_resid);
624 if (len == 0) {
625 break;
626 }
627 error = ubc_uiomove(uobj, uio, len, IO_ADV_DECODE(ioflag),
628 UBC_WRITE | UBC_UNMAP_FLAG(vp));
629 }
630 if (error) {
631 (void)tmpfs_reg_resize(vp, oldsize);
632 }
633
634 tmpfs_update(vp, TMPFS_UPDATE_MTIME | TMPFS_UPDATE_CTIME);
635 VN_KNOTE(vp, NOTE_WRITE);
636 out:
637 if (error) {
638 KASSERT(oldsize == node->tn_size);
639 } else {
640 KASSERT(uio->uio_resid == 0);
641 }
642 return error;
643 }
644
645 int
646 tmpfs_fsync(void *v)
647 {
648 struct vop_fsync_args /* {
649 struct vnode *a_vp;
650 kauth_cred_t a_cred;
651 int a_flags;
652 off_t a_offlo;
653 off_t a_offhi;
654 struct lwp *a_l;
655 } */ *ap = v;
656 vnode_t *vp __diagused = ap->a_vp;
657
658 /* Nothing to do. Should be up to date. */
659 KASSERT(VOP_ISLOCKED(vp));
660 return 0;
661 }
662
663 /*
664 * tmpfs_remove: unlink a file.
665 *
666 * => Both directory (dvp) and file (vp) are locked.
667 * => We unlock and drop the reference on both.
668 */
669 int
670 tmpfs_remove(void *v)
671 {
672 struct vop_remove_args /* {
673 struct vnode *a_dvp;
674 struct vnode *a_vp;
675 struct componentname *a_cnp;
676 } */ *ap = v;
677 vnode_t *dvp = ap->a_dvp, *vp = ap->a_vp;
678 tmpfs_node_t *dnode, *node;
679 tmpfs_dirent_t *de;
680 int error;
681
682 KASSERT(VOP_ISLOCKED(dvp));
683 KASSERT(VOP_ISLOCKED(vp));
684
685 if (vp->v_type == VDIR) {
686 error = EPERM;
687 goto out;
688 }
689 dnode = VP_TO_TMPFS_DIR(dvp);
690 node = VP_TO_TMPFS_NODE(vp);
691
692 /*
693 * Files marked as immutable or append-only cannot be deleted.
694 * Likewise, files residing on directories marked as append-only
695 * cannot be deleted.
696 */
697 if (node->tn_flags & (IMMUTABLE | APPEND)) {
698 error = EPERM;
699 goto out;
700 }
701 if (dnode->tn_flags & APPEND) {
702 error = EPERM;
703 goto out;
704 }
705
706 /* Lookup the directory entry (check the cached hint first). */
707 de = tmpfs_dir_cached(node);
708 if (de == NULL) {
709 struct componentname *cnp = ap->a_cnp;
710 de = tmpfs_dir_lookup(dnode, cnp);
711 }
712 KASSERT(de && de->td_node == node);
713
714 /*
715 * Remove the entry from the directory (drops the link count) and
716 * destroy it or replace with a whiteout.
717 *
718 * Note: the inode referred by it will not be destroyed until the
719 * vnode is reclaimed/recycled.
720 */
721
722 tmpfs_dir_detach(dnode, de);
723
724 if (ap->a_cnp->cn_flags & DOWHITEOUT)
725 tmpfs_dir_attach(dnode, de, TMPFS_NODE_WHITEOUT);
726 else
727 tmpfs_free_dirent(VFS_TO_TMPFS(vp->v_mount), de);
728
729 if (node->tn_links > 0) {
730 /* We removed a hard link. */
731 tmpfs_update(vp, TMPFS_UPDATE_CTIME);
732 }
733 tmpfs_update(dvp, TMPFS_UPDATE_MTIME | TMPFS_UPDATE_CTIME);
734 error = 0;
735 out:
736 /* Drop the references and unlock the vnodes. */
737 vput(vp);
738 if (dvp == vp) {
739 vrele(dvp);
740 } else {
741 vput(dvp);
742 }
743 return error;
744 }
745
746 /*
747 * tmpfs_link: create a hard link.
748 */
749 int
750 tmpfs_link(void *v)
751 {
752 struct vop_link_args /* {
753 struct vnode *a_dvp;
754 struct vnode *a_vp;
755 struct componentname *a_cnp;
756 } */ *ap = v;
757 vnode_t *dvp = ap->a_dvp;
758 vnode_t *vp = ap->a_vp;
759 struct componentname *cnp = ap->a_cnp;
760 tmpfs_node_t *dnode, *node;
761 tmpfs_dirent_t *de;
762 int error;
763
764 KASSERT(dvp != vp);
765 KASSERT(VOP_ISLOCKED(dvp));
766 KASSERT(vp->v_type != VDIR);
767 KASSERT(dvp->v_mount == vp->v_mount);
768
769 dnode = VP_TO_TMPFS_DIR(dvp);
770 node = VP_TO_TMPFS_NODE(vp);
771
772 vn_lock(vp, LK_EXCLUSIVE | LK_RETRY);
773
774 /* Check for maximum number of links limit. */
775 if (node->tn_links == LINK_MAX) {
776 error = EMLINK;
777 goto out;
778 }
779 KASSERT(node->tn_links < LINK_MAX);
780
781 /* We cannot create links of files marked immutable or append-only. */
782 if (node->tn_flags & (IMMUTABLE | APPEND)) {
783 error = EPERM;
784 goto out;
785 }
786
787 /* Allocate a new directory entry to represent the inode. */
788 error = tmpfs_alloc_dirent(VFS_TO_TMPFS(vp->v_mount),
789 cnp->cn_nameptr, cnp->cn_namelen, &de);
790 if (error) {
791 goto out;
792 }
793
794 /*
795 * Insert the entry into the directory.
796 * It will increase the inode link count.
797 */
798 tmpfs_dir_attach(dnode, de, node);
799 tmpfs_update(dvp, TMPFS_UPDATE_MTIME | TMPFS_UPDATE_CTIME);
800
801 /* Update the timestamps and trigger the event. */
802 if (node->tn_vnode) {
803 VN_KNOTE(node->tn_vnode, NOTE_LINK);
804 }
805 tmpfs_update(vp, TMPFS_UPDATE_CTIME);
806 error = 0;
807 out:
808 VOP_UNLOCK(vp);
809 vput(dvp);
810 return error;
811 }
812
813 int
814 tmpfs_mkdir(void *v)
815 {
816 struct vop_mkdir_v3_args /* {
817 struct vnode *a_dvp;
818 struct vnode **a_vpp;
819 struct componentname *a_cnp;
820 struct vattr *a_vap;
821 } */ *ap = v;
822 vnode_t *dvp = ap->a_dvp;
823 vnode_t **vpp = ap->a_vpp;
824 struct componentname *cnp = ap->a_cnp;
825 struct vattr *vap = ap->a_vap;
826
827 KASSERT(vap->va_type == VDIR);
828 return tmpfs_construct_node(dvp, vpp, vap, cnp, NULL);
829 }
830
831 int
832 tmpfs_rmdir(void *v)
833 {
834 struct vop_rmdir_args /* {
835 struct vnode *a_dvp;
836 struct vnode *a_vp;
837 struct componentname *a_cnp;
838 } */ *ap = v;
839 vnode_t *dvp = ap->a_dvp;
840 vnode_t *vp = ap->a_vp;
841 tmpfs_mount_t *tmp = VFS_TO_TMPFS(dvp->v_mount);
842 tmpfs_node_t *dnode = VP_TO_TMPFS_DIR(dvp);
843 tmpfs_node_t *node = VP_TO_TMPFS_DIR(vp);
844 tmpfs_dirent_t *de;
845 int error = 0;
846
847 KASSERT(VOP_ISLOCKED(dvp));
848 KASSERT(VOP_ISLOCKED(vp));
849
850 /*
851 * Directories with more than two entries ('.' and '..') cannot be
852 * removed. There may be whiteout entries, which we will destroy.
853 */
854 if (node->tn_size > 0) {
855 /*
856 * If never had whiteout entries, the directory is certainly
857 * not empty. Otherwise, scan for any non-whiteout entry.
858 */
859 if ((node->tn_gen & TMPFS_WHITEOUT_BIT) == 0) {
860 error = ENOTEMPTY;
861 goto out;
862 }
863 TAILQ_FOREACH(de, &node->tn_spec.tn_dir.tn_dir, td_entries) {
864 if (de->td_node != TMPFS_NODE_WHITEOUT) {
865 error = ENOTEMPTY;
866 goto out;
867 }
868 }
869 KASSERT(error == 0);
870 }
871
872 KASSERT(node->tn_spec.tn_dir.tn_parent == dnode);
873
874 /* Lookup the directory entry (check the cached hint first). */
875 de = tmpfs_dir_cached(node);
876 if (de == NULL) {
877 struct componentname *cnp = ap->a_cnp;
878 de = tmpfs_dir_lookup(dnode, cnp);
879 }
880 KASSERT(de && de->td_node == node);
881
882 /* Check flags to see if we are allowed to remove the directory. */
883 if (dnode->tn_flags & APPEND || node->tn_flags & (IMMUTABLE | APPEND)) {
884 error = EPERM;
885 goto out;
886 }
887
888 /* Decrement the link count for the virtual '.' entry. */
889 node->tn_links--;
890
891 /* Detach the directory entry from the directory. */
892 tmpfs_dir_detach(dnode, de);
893
894 /* Purge the cache for parent. */
895 cache_purge(dvp);
896
897 /*
898 * Destroy the directory entry or replace it with a whiteout.
899 *
900 * Note: the inode referred by it will not be destroyed until the
901 * vnode is reclaimed.
902 */
903 if (ap->a_cnp->cn_flags & DOWHITEOUT)
904 tmpfs_dir_attach(dnode, de, TMPFS_NODE_WHITEOUT);
905 else
906 tmpfs_free_dirent(tmp, de);
907
908 /* Destroy the whiteout entries from the node. */
909 while ((de = TAILQ_FIRST(&node->tn_spec.tn_dir.tn_dir)) != NULL) {
910 KASSERT(de->td_node == TMPFS_NODE_WHITEOUT);
911 tmpfs_dir_detach(node, de);
912 tmpfs_free_dirent(tmp, de);
913 }
914 tmpfs_update(dvp, TMPFS_UPDATE_MTIME | TMPFS_UPDATE_CTIME);
915
916 KASSERT(node->tn_size == 0);
917 KASSERT(node->tn_links == 0);
918 out:
919 /* Release the nodes. */
920 vput(dvp);
921 vput(vp);
922 return error;
923 }
924
925 int
926 tmpfs_symlink(void *v)
927 {
928 struct vop_symlink_v3_args /* {
929 struct vnode *a_dvp;
930 struct vnode **a_vpp;
931 struct componentname *a_cnp;
932 struct vattr *a_vap;
933 char *a_target;
934 } */ *ap = v;
935 vnode_t *dvp = ap->a_dvp;
936 vnode_t **vpp = ap->a_vpp;
937 struct componentname *cnp = ap->a_cnp;
938 struct vattr *vap = ap->a_vap;
939 char *target = ap->a_target;
940
941 KASSERT(vap->va_type == VLNK);
942 return tmpfs_construct_node(dvp, vpp, vap, cnp, target);
943 }
944
945 int
946 tmpfs_readdir(void *v)
947 {
948 struct vop_readdir_args /* {
949 struct vnode *a_vp;
950 struct uio *a_uio;
951 kauth_cred_t a_cred;
952 int *a_eofflag;
953 off_t **a_cookies;
954 int *ncookies;
955 } */ *ap = v;
956 vnode_t *vp = ap->a_vp;
957 struct uio *uio = ap->a_uio;
958 int *eofflag = ap->a_eofflag;
959 off_t **cookies = ap->a_cookies;
960 int *ncookies = ap->a_ncookies;
961 off_t startoff, cnt;
962 tmpfs_node_t *node;
963 int error;
964
965 KASSERT(VOP_ISLOCKED(vp));
966
967 /* This operation only makes sense on directory nodes. */
968 if (vp->v_type != VDIR) {
969 return ENOTDIR;
970 }
971 node = VP_TO_TMPFS_DIR(vp);
972 startoff = uio->uio_offset;
973 cnt = 0;
974
975 /*
976 * Retrieve the directory entries, unless it is being destroyed.
977 */
978 if (node->tn_links) {
979 error = tmpfs_dir_getdents(node, uio, &cnt);
980 } else {
981 error = 0;
982 }
983
984 if (eofflag != NULL) {
985 *eofflag = !error && uio->uio_offset == TMPFS_DIRSEQ_EOF;
986 }
987 if (error || cookies == NULL || ncookies == NULL) {
988 return error;
989 }
990
991 /* Update NFS-related variables, if any. */
992 tmpfs_dirent_t *de = NULL;
993 off_t i, off = startoff;
994
995 *cookies = malloc(cnt * sizeof(off_t), M_TEMP, M_WAITOK);
996 *ncookies = cnt;
997
998 for (i = 0; i < cnt; i++) {
999 KASSERT(off != TMPFS_DIRSEQ_EOF);
1000 if (off != TMPFS_DIRSEQ_DOT) {
1001 if (off == TMPFS_DIRSEQ_DOTDOT) {
1002 de = TAILQ_FIRST(&node->tn_spec.tn_dir.tn_dir);
1003 } else if (de != NULL) {
1004 de = TAILQ_NEXT(de, td_entries);
1005 } else {
1006 de = tmpfs_dir_lookupbyseq(node, off);
1007 KASSERT(de != NULL);
1008 de = TAILQ_NEXT(de, td_entries);
1009 }
1010 if (de == NULL) {
1011 off = TMPFS_DIRSEQ_EOF;
1012 } else {
1013 off = tmpfs_dir_getseq(node, de);
1014 }
1015 } else {
1016 off = TMPFS_DIRSEQ_DOTDOT;
1017 }
1018 (*cookies)[i] = off;
1019 }
1020 KASSERT(uio->uio_offset == off);
1021 return error;
1022 }
1023
1024 int
1025 tmpfs_readlink(void *v)
1026 {
1027 struct vop_readlink_args /* {
1028 struct vnode *a_vp;
1029 struct uio *a_uio;
1030 kauth_cred_t a_cred;
1031 } */ *ap = v;
1032 vnode_t *vp = ap->a_vp;
1033 struct uio *uio = ap->a_uio;
1034 tmpfs_node_t *node = VP_TO_TMPFS_NODE(vp);
1035 int error;
1036
1037 KASSERT(VOP_ISLOCKED(vp));
1038 KASSERT(uio->uio_offset == 0);
1039 KASSERT(vp->v_type == VLNK);
1040
1041 /* Note: readlink(2) returns the path without NUL terminator. */
1042 if (node->tn_size > 0) {
1043 error = uiomove(node->tn_spec.tn_lnk.tn_link,
1044 MIN(node->tn_size, uio->uio_resid), uio);
1045 } else {
1046 error = 0;
1047 }
1048 tmpfs_update(vp, TMPFS_UPDATE_ATIME);
1049
1050 return error;
1051 }
1052
1053 int
1054 tmpfs_inactive(void *v)
1055 {
1056 struct vop_inactive_args /* {
1057 struct vnode *a_vp;
1058 bool *a_recycle;
1059 } */ *ap = v;
1060 vnode_t *vp = ap->a_vp;
1061 tmpfs_node_t *node;
1062
1063 KASSERT(VOP_ISLOCKED(vp));
1064
1065 node = VP_TO_TMPFS_NODE(vp);
1066 if (node->tn_links == 0) {
1067 /*
1068 * Mark node as dead by setting its generation to zero.
1069 */
1070 atomic_and_32(&node->tn_gen, ~TMPFS_NODE_GEN_MASK);
1071 *ap->a_recycle = true;
1072 } else {
1073 *ap->a_recycle = false;
1074 }
1075 VOP_UNLOCK(vp);
1076
1077 return 0;
1078 }
1079
1080 int
1081 tmpfs_reclaim(void *v)
1082 {
1083 struct vop_reclaim_args /* {
1084 struct vnode *a_vp;
1085 } */ *ap = v;
1086 vnode_t *vp = ap->a_vp;
1087 tmpfs_mount_t *tmp = VFS_TO_TMPFS(vp->v_mount);
1088 tmpfs_node_t *node = VP_TO_TMPFS_NODE(vp);
1089 bool recycle;
1090
1091 mutex_enter(&node->tn_vlock);
1092
1093 /* Disassociate inode from vnode. */
1094 node->tn_vnode = NULL;
1095 vp->v_data = NULL;
1096
1097 /* If inode is not referenced, i.e. no links, then destroy it. */
1098 recycle = node->tn_links == 0 && TMPFS_NODE_RECLAIMING(node) == 0;
1099
1100 mutex_exit(&node->tn_vlock);
1101
1102 if (recycle) {
1103 tmpfs_free_node(tmp, node);
1104 }
1105 return 0;
1106 }
1107
1108 int
1109 tmpfs_pathconf(void *v)
1110 {
1111 struct vop_pathconf_args /* {
1112 struct vnode *a_vp;
1113 int a_name;
1114 register_t *a_retval;
1115 } */ *ap = v;
1116 const int name = ap->a_name;
1117 register_t *retval = ap->a_retval;
1118 int error = 0;
1119
1120 switch (name) {
1121 case _PC_LINK_MAX:
1122 *retval = LINK_MAX;
1123 break;
1124 case _PC_NAME_MAX:
1125 *retval = TMPFS_MAXNAMLEN;
1126 break;
1127 case _PC_PATH_MAX:
1128 *retval = PATH_MAX;
1129 break;
1130 case _PC_PIPE_BUF:
1131 *retval = PIPE_BUF;
1132 break;
1133 case _PC_CHOWN_RESTRICTED:
1134 *retval = 1;
1135 break;
1136 case _PC_NO_TRUNC:
1137 *retval = 1;
1138 break;
1139 case _PC_SYNC_IO:
1140 *retval = 1;
1141 break;
1142 case _PC_FILESIZEBITS:
1143 *retval = sizeof(off_t) * CHAR_BIT;
1144 break;
1145 default:
1146 error = EINVAL;
1147 }
1148 return error;
1149 }
1150
1151 int
1152 tmpfs_advlock(void *v)
1153 {
1154 struct vop_advlock_args /* {
1155 struct vnode *a_vp;
1156 void * a_id;
1157 int a_op;
1158 struct flock *a_fl;
1159 int a_flags;
1160 } */ *ap = v;
1161 vnode_t *vp = ap->a_vp;
1162 tmpfs_node_t *node = VP_TO_TMPFS_NODE(vp);
1163
1164 return lf_advlock(v, &node->tn_lockf, node->tn_size);
1165 }
1166
1167 int
1168 tmpfs_getpages(void *v)
1169 {
1170 struct vop_getpages_args /* {
1171 struct vnode *a_vp;
1172 voff_t a_offset;
1173 struct vm_page **a_m;
1174 int *a_count;
1175 int a_centeridx;
1176 vm_prot_t a_access_type;
1177 int a_advice;
1178 int a_flags;
1179 } */ * const ap = v;
1180 vnode_t *vp = ap->a_vp;
1181 const voff_t offset = ap->a_offset;
1182 struct vm_page **pgs = ap->a_m;
1183 const int centeridx = ap->a_centeridx;
1184 const vm_prot_t access_type = ap->a_access_type;
1185 const int advice = ap->a_advice;
1186 const int flags = ap->a_flags;
1187 int error, npages = *ap->a_count;
1188 tmpfs_node_t *node;
1189 struct uvm_object *uobj;
1190
1191 KASSERT(vp->v_type == VREG);
1192 KASSERT(mutex_owned(vp->v_interlock));
1193
1194 node = VP_TO_TMPFS_NODE(vp);
1195 uobj = node->tn_spec.tn_reg.tn_aobj;
1196
1197 /*
1198 * Currently, PGO_PASTEOF is not supported.
1199 */
1200 if (vp->v_size <= offset + (centeridx << PAGE_SHIFT)) {
1201 if ((flags & PGO_LOCKED) == 0)
1202 mutex_exit(vp->v_interlock);
1203 return EINVAL;
1204 }
1205
1206 if (vp->v_size < offset + (npages << PAGE_SHIFT)) {
1207 npages = (round_page(vp->v_size) - offset) >> PAGE_SHIFT;
1208 }
1209
1210 if ((flags & PGO_LOCKED) != 0)
1211 return EBUSY;
1212
1213 if ((flags & PGO_NOTIMESTAMP) == 0) {
1214 u_int tflags = 0;
1215
1216 if ((vp->v_mount->mnt_flag & MNT_NOATIME) == 0)
1217 tflags |= TMPFS_UPDATE_ATIME;
1218
1219 if ((access_type & VM_PROT_WRITE) != 0) {
1220 tflags |= TMPFS_UPDATE_MTIME;
1221 if (vp->v_mount->mnt_flag & MNT_RELATIME)
1222 tflags |= TMPFS_UPDATE_ATIME;
1223 }
1224 tmpfs_update(vp, tflags);
1225 }
1226
1227 /*
1228 * Invoke the pager.
1229 *
1230 * Clean the array of pages before. XXX: PR/32166
1231 * Note that vnode lock is shared with underlying UVM object.
1232 */
1233 if (pgs) {
1234 memset(pgs, 0, sizeof(struct vm_pages *) * npages);
1235 }
1236 KASSERT(vp->v_interlock == uobj->vmobjlock);
1237
1238 error = (*uobj->pgops->pgo_get)(uobj, offset, pgs, &npages, centeridx,
1239 access_type, advice, flags | PGO_ALLPAGES);
1240
1241 #if defined(DEBUG)
1242 if (!error && pgs) {
1243 for (int i = 0; i < npages; i++) {
1244 KASSERT(pgs[i] != NULL);
1245 }
1246 }
1247 #endif
1248 return error;
1249 }
1250
1251 int
1252 tmpfs_putpages(void *v)
1253 {
1254 struct vop_putpages_args /* {
1255 struct vnode *a_vp;
1256 voff_t a_offlo;
1257 voff_t a_offhi;
1258 int a_flags;
1259 } */ * const ap = v;
1260 vnode_t *vp = ap->a_vp;
1261 const voff_t offlo = ap->a_offlo;
1262 const voff_t offhi = ap->a_offhi;
1263 const int flags = ap->a_flags;
1264 tmpfs_node_t *node;
1265 struct uvm_object *uobj;
1266 int error;
1267
1268 KASSERT(mutex_owned(vp->v_interlock));
1269
1270 if (vp->v_type != VREG) {
1271 mutex_exit(vp->v_interlock);
1272 return 0;
1273 }
1274
1275 if ((vp->v_mount->mnt_flag & MNT_RDONLY) != 0) {
1276 mutex_exit(vp->v_interlock);
1277 return EROFS;
1278 }
1279
1280 node = VP_TO_TMPFS_NODE(vp);
1281 uobj = node->tn_spec.tn_reg.tn_aobj;
1282
1283 KASSERT(vp->v_interlock == uobj->vmobjlock);
1284 error = (*uobj->pgops->pgo_put)(uobj, offlo, offhi, flags);
1285
1286 /* XXX mtime */
1287
1288 return error;
1289 }
1290
1291 int
1292 tmpfs_whiteout(void *v)
1293 {
1294 struct vop_whiteout_args /* {
1295 struct vnode *a_dvp;
1296 struct componentname *a_cnp;
1297 int a_flags;
1298 } */ *ap = v;
1299 vnode_t *dvp = ap->a_dvp;
1300 struct componentname *cnp = ap->a_cnp;
1301 const int flags = ap->a_flags;
1302 tmpfs_mount_t *tmp = VFS_TO_TMPFS(dvp->v_mount);
1303 tmpfs_node_t *dnode = VP_TO_TMPFS_DIR(dvp);
1304 tmpfs_dirent_t *de;
1305 int error;
1306
1307 switch (flags) {
1308 case LOOKUP:
1309 break;
1310 case CREATE:
1311 error = tmpfs_alloc_dirent(tmp, cnp->cn_nameptr,
1312 cnp->cn_namelen, &de);
1313 if (error)
1314 return error;
1315 tmpfs_dir_attach(dnode, de, TMPFS_NODE_WHITEOUT);
1316 break;
1317 case DELETE:
1318 cnp->cn_flags &= ~DOWHITEOUT; /* when in doubt, cargo cult */
1319 de = tmpfs_dir_lookup(dnode, cnp);
1320 if (de == NULL)
1321 return ENOENT;
1322 tmpfs_dir_detach(dnode, de);
1323 tmpfs_free_dirent(tmp, de);
1324 break;
1325 }
1326 tmpfs_update(dvp, TMPFS_UPDATE_MTIME | TMPFS_UPDATE_CTIME);
1327 return 0;
1328 }
1329
1330 int
1331 tmpfs_print(void *v)
1332 {
1333 struct vop_print_args /* {
1334 struct vnode *a_vp;
1335 } */ *ap = v;
1336 vnode_t *vp = ap->a_vp;
1337 tmpfs_node_t *node = VP_TO_TMPFS_NODE(vp);
1338
1339 printf("tag VT_TMPFS, tmpfs_node %p, flags 0x%x, links %d\n"
1340 "\tmode 0%o, owner %d, group %d, size %" PRIdMAX,
1341 node, node->tn_flags, node->tn_links, node->tn_mode, node->tn_uid,
1342 node->tn_gid, (uintmax_t)node->tn_size);
1343 if (vp->v_type == VFIFO) {
1344 VOCALL(fifo_vnodeop_p, VOFFSET(vop_print), v);
1345 }
1346 printf("\n");
1347 return 0;
1348 }
1349