tmpfs_vnops.c revision 1.92.2.7 1 /* $NetBSD: tmpfs_vnops.c,v 1.92.2.7 2014/05/22 11:41:02 yamt Exp $ */
2
3 /*
4 * Copyright (c) 2005, 2006, 2007 The NetBSD Foundation, Inc.
5 * All rights reserved.
6 *
7 * This code is derived from software contributed to The NetBSD Foundation
8 * by Julio M. Merino Vidal, developed as part of Google's Summer of Code
9 * 2005 program.
10 *
11 * Redistribution and use in source and binary forms, with or without
12 * modification, are permitted provided that the following conditions
13 * are met:
14 * 1. Redistributions of source code must retain the above copyright
15 * notice, this list of conditions and the following disclaimer.
16 * 2. Redistributions in binary form must reproduce the above copyright
17 * notice, this list of conditions and the following disclaimer in the
18 * documentation and/or other materials provided with the distribution.
19 *
20 * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
21 * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
22 * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
23 * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
24 * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
25 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
26 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
27 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
28 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
29 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
30 * POSSIBILITY OF SUCH DAMAGE.
31 */
32
33 /*
34 * tmpfs vnode interface.
35 */
36
37 #include <sys/cdefs.h>
38 __KERNEL_RCSID(0, "$NetBSD: tmpfs_vnops.c,v 1.92.2.7 2014/05/22 11:41:02 yamt Exp $");
39
40 #include <sys/param.h>
41 #include <sys/dirent.h>
42 #include <sys/fcntl.h>
43 #include <sys/event.h>
44 #include <sys/malloc.h>
45 #include <sys/namei.h>
46 #include <sys/stat.h>
47 #include <sys/uio.h>
48 #include <sys/unistd.h>
49 #include <sys/vnode.h>
50 #include <sys/lockf.h>
51 #include <sys/kauth.h>
52 #include <sys/atomic.h>
53
54 #include <uvm/uvm.h>
55
56 #include <miscfs/fifofs/fifo.h>
57 #include <miscfs/genfs/genfs.h>
58 #include <fs/tmpfs/tmpfs_vnops.h>
59 #include <fs/tmpfs/tmpfs.h>
60
61 /*
62 * vnode operations vector used for files stored in a tmpfs file system.
63 */
64 int (**tmpfs_vnodeop_p)(void *);
65 const struct vnodeopv_entry_desc tmpfs_vnodeop_entries[] = {
66 { &vop_default_desc, vn_default_error },
67 { &vop_lookup_desc, tmpfs_lookup },
68 { &vop_create_desc, tmpfs_create },
69 { &vop_mknod_desc, tmpfs_mknod },
70 { &vop_open_desc, tmpfs_open },
71 { &vop_close_desc, tmpfs_close },
72 { &vop_access_desc, tmpfs_access },
73 { &vop_getattr_desc, tmpfs_getattr },
74 { &vop_setattr_desc, tmpfs_setattr },
75 { &vop_read_desc, tmpfs_read },
76 { &vop_write_desc, tmpfs_write },
77 { &vop_ioctl_desc, tmpfs_ioctl },
78 { &vop_fcntl_desc, tmpfs_fcntl },
79 { &vop_poll_desc, tmpfs_poll },
80 { &vop_kqfilter_desc, tmpfs_kqfilter },
81 { &vop_revoke_desc, tmpfs_revoke },
82 { &vop_mmap_desc, tmpfs_mmap },
83 { &vop_fsync_desc, tmpfs_fsync },
84 { &vop_seek_desc, tmpfs_seek },
85 { &vop_remove_desc, tmpfs_remove },
86 { &vop_link_desc, tmpfs_link },
87 { &vop_rename_desc, tmpfs_rename },
88 { &vop_mkdir_desc, tmpfs_mkdir },
89 { &vop_rmdir_desc, tmpfs_rmdir },
90 { &vop_symlink_desc, tmpfs_symlink },
91 { &vop_readdir_desc, tmpfs_readdir },
92 { &vop_readlink_desc, tmpfs_readlink },
93 { &vop_abortop_desc, tmpfs_abortop },
94 { &vop_inactive_desc, tmpfs_inactive },
95 { &vop_reclaim_desc, tmpfs_reclaim },
96 { &vop_lock_desc, tmpfs_lock },
97 { &vop_unlock_desc, tmpfs_unlock },
98 { &vop_bmap_desc, tmpfs_bmap },
99 { &vop_strategy_desc, tmpfs_strategy },
100 { &vop_print_desc, tmpfs_print },
101 { &vop_pathconf_desc, tmpfs_pathconf },
102 { &vop_islocked_desc, tmpfs_islocked },
103 { &vop_advlock_desc, tmpfs_advlock },
104 { &vop_bwrite_desc, tmpfs_bwrite },
105 { &vop_getpages_desc, tmpfs_getpages },
106 { &vop_putpages_desc, tmpfs_putpages },
107 { &vop_whiteout_desc, tmpfs_whiteout },
108 { NULL, NULL }
109 };
110
111 const struct vnodeopv_desc tmpfs_vnodeop_opv_desc = {
112 &tmpfs_vnodeop_p, tmpfs_vnodeop_entries
113 };
114
115 /*
116 * tmpfs_lookup: path name traversal routine.
117 *
118 * Arguments: dvp (directory being searched), vpp (result),
119 * cnp (component name - path).
120 *
121 * => Caller holds a reference and lock on dvp.
122 * => We return looked-up vnode (vpp) locked, with a reference held.
123 */
124 int
125 tmpfs_lookup(void *v)
126 {
127 struct vop_lookup_v2_args /* {
128 struct vnode *a_dvp;
129 struct vnode **a_vpp;
130 struct componentname *a_cnp;
131 } */ *ap = v;
132 vnode_t *dvp = ap->a_dvp, **vpp = ap->a_vpp;
133 struct componentname *cnp = ap->a_cnp;
134 const bool lastcn = (cnp->cn_flags & ISLASTCN) != 0;
135 tmpfs_node_t *dnode, *tnode;
136 tmpfs_dirent_t *de;
137 int cachefound, iswhiteout;
138 int error;
139
140 KASSERT(VOP_ISLOCKED(dvp));
141
142 dnode = VP_TO_TMPFS_DIR(dvp);
143 *vpp = NULL;
144
145 /* Check accessibility of directory. */
146 error = VOP_ACCESS(dvp, VEXEC, cnp->cn_cred);
147 if (error) {
148 goto out;
149 }
150
151 /*
152 * If requesting the last path component on a read-only file system
153 * with a write operation, deny it.
154 */
155 if (lastcn && (dvp->v_mount->mnt_flag & MNT_RDONLY) != 0 &&
156 (cnp->cn_nameiop == DELETE || cnp->cn_nameiop == RENAME)) {
157 error = EROFS;
158 goto out;
159 }
160
161 /*
162 * Avoid doing a linear scan of the directory if the requested
163 * directory/name couple is already in the cache.
164 */
165 cachefound = cache_lookup(dvp, cnp->cn_nameptr, cnp->cn_namelen,
166 cnp->cn_nameiop, cnp->cn_flags,
167 &iswhiteout, vpp);
168 if (iswhiteout) {
169 cnp->cn_flags |= ISWHITEOUT;
170 }
171 if (cachefound && *vpp == NULLVP) {
172 /* Negative cache hit. */
173 error = ENOENT;
174 goto out_unlocked;
175 } else if (cachefound) {
176 error = 0;
177 goto out_unlocked;
178 }
179
180 /*
181 * Treat an unlinked directory as empty (no "." or "..")
182 */
183 if (dnode->tn_links == 0) {
184 KASSERT(dnode->tn_size == 0);
185 error = ENOENT;
186 goto out;
187 }
188
189 if (cnp->cn_flags & ISDOTDOT) {
190 tmpfs_node_t *pnode;
191
192 /*
193 * Lookup of ".." case.
194 */
195 if (lastcn && cnp->cn_nameiop == RENAME) {
196 error = EINVAL;
197 goto out;
198 }
199 KASSERT(dnode->tn_type == VDIR);
200 pnode = dnode->tn_spec.tn_dir.tn_parent;
201 if (pnode == NULL) {
202 error = ENOENT;
203 goto out;
204 }
205
206 /*
207 * Lock the parent tn_vlock before releasing the vnode lock,
208 * and thus prevent parent from disappearing.
209 */
210 mutex_enter(&pnode->tn_vlock);
211 VOP_UNLOCK(dvp);
212
213 /*
214 * Get a vnode of the '..' entry and re-acquire the lock.
215 * Release the tn_vlock.
216 */
217 error = tmpfs_vnode_get(dvp->v_mount, pnode, vpp);
218 vn_lock(dvp, LK_EXCLUSIVE | LK_RETRY);
219 goto out;
220
221 } else if (cnp->cn_namelen == 1 && cnp->cn_nameptr[0] == '.') {
222 /*
223 * Lookup of "." case.
224 */
225 if (lastcn && cnp->cn_nameiop == RENAME) {
226 error = EISDIR;
227 goto out;
228 }
229 vref(dvp);
230 *vpp = dvp;
231 error = 0;
232 goto done;
233 }
234
235 /*
236 * Other lookup cases: perform directory scan.
237 */
238 de = tmpfs_dir_lookup(dnode, cnp);
239 if (de == NULL || de->td_node == TMPFS_NODE_WHITEOUT) {
240 /*
241 * The entry was not found in the directory. This is valid
242 * if we are creating or renaming an entry and are working
243 * on the last component of the path name.
244 */
245 if (lastcn && (cnp->cn_nameiop == CREATE ||
246 cnp->cn_nameiop == RENAME)) {
247 error = VOP_ACCESS(dvp, VWRITE, cnp->cn_cred);
248 if (error) {
249 goto out;
250 }
251 error = EJUSTRETURN;
252 } else {
253 error = ENOENT;
254 }
255 if (de) {
256 KASSERT(de->td_node == TMPFS_NODE_WHITEOUT);
257 cnp->cn_flags |= ISWHITEOUT;
258 }
259 goto done;
260 }
261
262 tnode = de->td_node;
263
264 /*
265 * If it is not the last path component and found a non-directory
266 * or non-link entry (which may itself be pointing to a directory),
267 * raise an error.
268 */
269 if (!lastcn && tnode->tn_type != VDIR && tnode->tn_type != VLNK) {
270 error = ENOTDIR;
271 goto out;
272 }
273
274 /* Check the permissions. */
275 if (lastcn && (cnp->cn_nameiop == DELETE || cnp->cn_nameiop == RENAME)) {
276 error = VOP_ACCESS(dvp, VWRITE, cnp->cn_cred);
277 if (error)
278 goto out;
279
280 if ((dnode->tn_mode & S_ISTXT) != 0) {
281 error = kauth_authorize_vnode(cnp->cn_cred,
282 KAUTH_VNODE_DELETE, tnode->tn_vnode,
283 dnode->tn_vnode, genfs_can_sticky(cnp->cn_cred,
284 dnode->tn_uid, tnode->tn_uid));
285 if (error) {
286 error = EPERM;
287 goto out;
288 }
289 }
290 }
291
292 /* Get a vnode for the matching entry. */
293 mutex_enter(&tnode->tn_vlock);
294 error = tmpfs_vnode_get(dvp->v_mount, tnode, vpp);
295 done:
296 /*
297 * Cache the result, unless request was for creation (as it does
298 * not improve the performance).
299 */
300 if (cnp->cn_nameiop != CREATE) {
301 cache_enter(dvp, *vpp, cnp->cn_nameptr, cnp->cn_namelen,
302 cnp->cn_flags);
303 }
304 out:
305 if (error == 0 && *vpp != dvp)
306 VOP_UNLOCK(*vpp);
307 out_unlocked:
308 KASSERT(VOP_ISLOCKED(dvp));
309
310 return error;
311 }
312
313 int
314 tmpfs_create(void *v)
315 {
316 struct vop_create_v3_args /* {
317 struct vnode *a_dvp;
318 struct vnode **a_vpp;
319 struct componentname *a_cnp;
320 struct vattr *a_vap;
321 } */ *ap = v;
322 vnode_t *dvp = ap->a_dvp, **vpp = ap->a_vpp;
323 struct componentname *cnp = ap->a_cnp;
324 struct vattr *vap = ap->a_vap;
325
326 KASSERT(VOP_ISLOCKED(dvp));
327 KASSERT(vap->va_type == VREG || vap->va_type == VSOCK);
328 return tmpfs_construct_node(dvp, vpp, vap, cnp, NULL);
329 }
330
331 int
332 tmpfs_mknod(void *v)
333 {
334 struct vop_mknod_v3_args /* {
335 struct vnode *a_dvp;
336 struct vnode **a_vpp;
337 struct componentname *a_cnp;
338 struct vattr *a_vap;
339 } */ *ap = v;
340 vnode_t *dvp = ap->a_dvp, **vpp = ap->a_vpp;
341 struct componentname *cnp = ap->a_cnp;
342 struct vattr *vap = ap->a_vap;
343 enum vtype vt = vap->va_type;
344
345 if (vt != VBLK && vt != VCHR && vt != VFIFO) {
346 vput(dvp);
347 return EINVAL;
348 }
349 return tmpfs_construct_node(dvp, vpp, vap, cnp, NULL);
350 }
351
352 int
353 tmpfs_open(void *v)
354 {
355 struct vop_open_args /* {
356 struct vnode *a_vp;
357 int a_mode;
358 kauth_cred_t a_cred;
359 } */ *ap = v;
360 vnode_t *vp = ap->a_vp;
361 mode_t mode = ap->a_mode;
362 tmpfs_node_t *node;
363
364 KASSERT(VOP_ISLOCKED(vp));
365
366 node = VP_TO_TMPFS_NODE(vp);
367
368 /* If the file is marked append-only, deny write requests. */
369 if ((node->tn_flags & APPEND) != 0 &&
370 (mode & (FWRITE | O_APPEND)) == FWRITE) {
371 return EPERM;
372 }
373 return 0;
374 }
375
376 int
377 tmpfs_close(void *v)
378 {
379 struct vop_close_args /* {
380 struct vnode *a_vp;
381 int a_fflag;
382 kauth_cred_t a_cred;
383 } */ *ap = v;
384 vnode_t *vp __diagused = ap->a_vp;
385
386 KASSERT(VOP_ISLOCKED(vp));
387 return 0;
388 }
389
390 int
391 tmpfs_access(void *v)
392 {
393 struct vop_access_args /* {
394 struct vnode *a_vp;
395 int a_mode;
396 kauth_cred_t a_cred;
397 } */ *ap = v;
398 vnode_t *vp = ap->a_vp;
399 mode_t mode = ap->a_mode;
400 kauth_cred_t cred = ap->a_cred;
401 tmpfs_node_t *node = VP_TO_TMPFS_NODE(vp);
402 const bool writing = (mode & VWRITE) != 0;
403
404 KASSERT(VOP_ISLOCKED(vp));
405
406 /* Possible? */
407 switch (vp->v_type) {
408 case VDIR:
409 case VLNK:
410 case VREG:
411 if (writing && (vp->v_mount->mnt_flag & MNT_RDONLY) != 0) {
412 return EROFS;
413 }
414 break;
415 case VBLK:
416 case VCHR:
417 case VSOCK:
418 case VFIFO:
419 break;
420 default:
421 return EINVAL;
422 }
423 if (writing && (node->tn_flags & IMMUTABLE) != 0) {
424 return EPERM;
425 }
426
427 return kauth_authorize_vnode(cred, KAUTH_ACCESS_ACTION(mode,
428 vp->v_type, node->tn_mode), vp, NULL, genfs_can_access(vp->v_type,
429 node->tn_mode, node->tn_uid, node->tn_gid, mode, cred));
430 }
431
432 int
433 tmpfs_getattr(void *v)
434 {
435 struct vop_getattr_args /* {
436 struct vnode *a_vp;
437 struct vattr *a_vap;
438 kauth_cred_t a_cred;
439 } */ *ap = v;
440 vnode_t *vp = ap->a_vp;
441 struct vattr *vap = ap->a_vap;
442 tmpfs_node_t *node = VP_TO_TMPFS_NODE(vp);
443
444 vattr_null(vap);
445
446 vap->va_type = vp->v_type;
447 vap->va_mode = node->tn_mode;
448 vap->va_nlink = node->tn_links;
449 vap->va_uid = node->tn_uid;
450 vap->va_gid = node->tn_gid;
451 vap->va_fsid = vp->v_mount->mnt_stat.f_fsidx.__fsid_val[0];
452 vap->va_fileid = node->tn_id;
453 vap->va_size = node->tn_size;
454 vap->va_blocksize = PAGE_SIZE;
455 vap->va_atime = node->tn_atime;
456 vap->va_mtime = node->tn_mtime;
457 vap->va_ctime = node->tn_ctime;
458 vap->va_birthtime = node->tn_birthtime;
459 vap->va_gen = TMPFS_NODE_GEN(node);
460 vap->va_flags = node->tn_flags;
461 vap->va_rdev = (vp->v_type == VBLK || vp->v_type == VCHR) ?
462 node->tn_spec.tn_dev.tn_rdev : VNOVAL;
463 vap->va_bytes = round_page(node->tn_size);
464 vap->va_filerev = VNOVAL;
465 vap->va_vaflags = 0;
466 vap->va_spare = VNOVAL; /* XXX */
467
468 return 0;
469 }
470
471 int
472 tmpfs_setattr(void *v)
473 {
474 struct vop_setattr_args /* {
475 struct vnode *a_vp;
476 struct vattr *a_vap;
477 kauth_cred_t a_cred;
478 } */ *ap = v;
479 vnode_t *vp = ap->a_vp;
480 struct vattr *vap = ap->a_vap;
481 kauth_cred_t cred = ap->a_cred;
482 lwp_t *l = curlwp;
483 int error = 0;
484
485 KASSERT(VOP_ISLOCKED(vp));
486
487 /* Abort if any unsettable attribute is given. */
488 if (vap->va_type != VNON || vap->va_nlink != VNOVAL ||
489 vap->va_fsid != VNOVAL || vap->va_fileid != VNOVAL ||
490 vap->va_blocksize != VNOVAL || vap->va_ctime.tv_sec != VNOVAL ||
491 vap->va_gen != VNOVAL || vap->va_rdev != VNOVAL ||
492 vap->va_bytes != VNOVAL) {
493 return EINVAL;
494 }
495
496 if (error == 0 && vap->va_flags != VNOVAL)
497 error = tmpfs_chflags(vp, vap->va_flags, cred, l);
498
499 if (error == 0 && vap->va_size != VNOVAL)
500 error = tmpfs_chsize(vp, vap->va_size, cred, l);
501
502 if (error == 0 && (vap->va_uid != VNOVAL || vap->va_gid != VNOVAL))
503 error = tmpfs_chown(vp, vap->va_uid, vap->va_gid, cred, l);
504
505 if (error == 0 && vap->va_mode != VNOVAL)
506 error = tmpfs_chmod(vp, vap->va_mode, cred, l);
507
508 const bool chsometime =
509 vap->va_atime.tv_sec != VNOVAL ||
510 vap->va_mtime.tv_sec != VNOVAL ||
511 vap->va_birthtime.tv_sec != VNOVAL;
512 if (error == 0 && chsometime) {
513 error = tmpfs_chtimes(vp, &vap->va_atime, &vap->va_mtime,
514 &vap->va_birthtime, vap->va_vaflags, cred, l);
515 }
516 return error;
517 }
518
519 int
520 tmpfs_read(void *v)
521 {
522 struct vop_read_args /* {
523 struct vnode *a_vp;
524 struct uio *a_uio;
525 int a_ioflag;
526 kauth_cred_t a_cred;
527 } */ *ap = v;
528 vnode_t *vp = ap->a_vp;
529 struct uio *uio = ap->a_uio;
530 const int ioflag = ap->a_ioflag;
531 tmpfs_node_t *node;
532 struct uvm_object *uobj;
533 const int advice = IO_ADV_DECODE(ioflag);
534 int error;
535
536 KASSERT(VOP_ISLOCKED(vp));
537
538 if (vp->v_type == VDIR) {
539 return EISDIR;
540 }
541 if (uio->uio_offset < 0 || vp->v_type != VREG) {
542 return EINVAL;
543 }
544
545 /* Note: reading zero bytes should not update atime. */
546 if (uio->uio_resid == 0) {
547 return 0;
548 }
549
550 node = VP_TO_TMPFS_NODE(vp);
551 uobj = node->tn_spec.tn_reg.tn_aobj;
552 error = 0;
553
554 if (uio->uio_offset + uio->uio_resid <= node->tn_size) {
555 uvm_loanobj(&vp->v_uobj, uio, advice);
556 }
557 while (error == 0 && uio->uio_resid > 0) {
558 vsize_t len;
559
560 if (node->tn_size <= uio->uio_offset) {
561 break;
562 }
563 len = MIN(node->tn_size - uio->uio_offset, uio->uio_resid);
564 if (len == 0) {
565 break;
566 }
567 error = ubc_uiomove(uobj, uio, len, advice,
568 UBC_READ | UBC_PARTIALOK | UBC_UNMAP_FLAG(vp));
569 }
570
571 tmpfs_update(vp, TMPFS_UPDATE_ATIME);
572 return error;
573 }
574
575 int
576 tmpfs_write(void *v)
577 {
578 struct vop_write_args /* {
579 struct vnode *a_vp;
580 struct uio *a_uio;
581 int a_ioflag;
582 kauth_cred_t a_cred;
583 } */ *ap = v;
584 vnode_t *vp = ap->a_vp;
585 struct uio *uio = ap->a_uio;
586 const int ioflag = ap->a_ioflag;
587 tmpfs_node_t *node;
588 struct uvm_object *uobj;
589 off_t oldsize;
590 int error;
591
592 KASSERT(VOP_ISLOCKED(vp));
593
594 node = VP_TO_TMPFS_NODE(vp);
595 oldsize = node->tn_size;
596
597 if (uio->uio_offset < 0 || vp->v_type != VREG) {
598 error = EINVAL;
599 goto out;
600 }
601 if (uio->uio_resid == 0) {
602 error = 0;
603 goto out;
604 }
605 if (ioflag & IO_APPEND) {
606 uio->uio_offset = node->tn_size;
607 }
608
609 if (uio->uio_offset + uio->uio_resid > node->tn_size) {
610 error = tmpfs_reg_resize(vp, uio->uio_offset + uio->uio_resid);
611 if (error)
612 goto out;
613 }
614
615 uobj = node->tn_spec.tn_reg.tn_aobj;
616 error = 0;
617 while (error == 0 && uio->uio_resid > 0) {
618 vsize_t len;
619
620 len = MIN(node->tn_size - uio->uio_offset, uio->uio_resid);
621 if (len == 0) {
622 break;
623 }
624 error = ubc_uiomove(uobj, uio, len, IO_ADV_DECODE(ioflag),
625 UBC_WRITE | UBC_UNMAP_FLAG(vp));
626 }
627 if (error) {
628 (void)tmpfs_reg_resize(vp, oldsize);
629 }
630
631 tmpfs_update(vp, TMPFS_UPDATE_MTIME | TMPFS_UPDATE_CTIME);
632 VN_KNOTE(vp, NOTE_WRITE);
633 out:
634 if (error) {
635 KASSERT(oldsize == node->tn_size);
636 } else {
637 KASSERT(uio->uio_resid == 0);
638 }
639 return error;
640 }
641
642 int
643 tmpfs_fsync(void *v)
644 {
645 struct vop_fsync_args /* {
646 struct vnode *a_vp;
647 kauth_cred_t a_cred;
648 int a_flags;
649 off_t a_offlo;
650 off_t a_offhi;
651 struct lwp *a_l;
652 } */ *ap = v;
653 vnode_t *vp __diagused = ap->a_vp;
654
655 /* Nothing to do. Should be up to date. */
656 KASSERT(VOP_ISLOCKED(vp));
657 return 0;
658 }
659
660 /*
661 * tmpfs_remove: unlink a file.
662 *
663 * => Both directory (dvp) and file (vp) are locked.
664 * => We unlock and drop the reference on both.
665 */
666 int
667 tmpfs_remove(void *v)
668 {
669 struct vop_remove_args /* {
670 struct vnode *a_dvp;
671 struct vnode *a_vp;
672 struct componentname *a_cnp;
673 } */ *ap = v;
674 vnode_t *dvp = ap->a_dvp, *vp = ap->a_vp;
675 tmpfs_node_t *dnode, *node;
676 tmpfs_dirent_t *de;
677 int error;
678
679 KASSERT(VOP_ISLOCKED(dvp));
680 KASSERT(VOP_ISLOCKED(vp));
681
682 if (vp->v_type == VDIR) {
683 error = EPERM;
684 goto out;
685 }
686 dnode = VP_TO_TMPFS_DIR(dvp);
687 node = VP_TO_TMPFS_NODE(vp);
688
689 /*
690 * Files marked as immutable or append-only cannot be deleted.
691 * Likewise, files residing on directories marked as append-only
692 * cannot be deleted.
693 */
694 if (node->tn_flags & (IMMUTABLE | APPEND)) {
695 error = EPERM;
696 goto out;
697 }
698 if (dnode->tn_flags & APPEND) {
699 error = EPERM;
700 goto out;
701 }
702
703 /* Lookup the directory entry (check the cached hint first). */
704 de = tmpfs_dir_cached(node);
705 if (de == NULL) {
706 struct componentname *cnp = ap->a_cnp;
707 de = tmpfs_dir_lookup(dnode, cnp);
708 }
709 KASSERT(de && de->td_node == node);
710
711 /*
712 * Remove the entry from the directory (drops the link count) and
713 * destroy it or replace with a whiteout.
714 *
715 * Note: the inode referred by it will not be destroyed until the
716 * vnode is reclaimed/recycled.
717 */
718
719 tmpfs_dir_detach(dnode, de);
720
721 if (ap->a_cnp->cn_flags & DOWHITEOUT)
722 tmpfs_dir_attach(dnode, de, TMPFS_NODE_WHITEOUT);
723 else
724 tmpfs_free_dirent(VFS_TO_TMPFS(vp->v_mount), de);
725
726 if (node->tn_links > 0) {
727 /* We removed a hard link. */
728 tmpfs_update(vp, TMPFS_UPDATE_CTIME);
729 }
730 tmpfs_update(dvp, TMPFS_UPDATE_MTIME | TMPFS_UPDATE_CTIME);
731 error = 0;
732 out:
733 /* Drop the references and unlock the vnodes. */
734 vput(vp);
735 if (dvp == vp) {
736 vrele(dvp);
737 } else {
738 vput(dvp);
739 }
740 return error;
741 }
742
743 /*
744 * tmpfs_link: create a hard link.
745 */
746 int
747 tmpfs_link(void *v)
748 {
749 struct vop_link_args /* {
750 struct vnode *a_dvp;
751 struct vnode *a_vp;
752 struct componentname *a_cnp;
753 } */ *ap = v;
754 vnode_t *dvp = ap->a_dvp;
755 vnode_t *vp = ap->a_vp;
756 struct componentname *cnp = ap->a_cnp;
757 tmpfs_node_t *dnode, *node;
758 tmpfs_dirent_t *de;
759 int error;
760
761 KASSERT(dvp != vp);
762 KASSERT(VOP_ISLOCKED(dvp));
763 KASSERT(vp->v_type != VDIR);
764 KASSERT(dvp->v_mount == vp->v_mount);
765
766 dnode = VP_TO_TMPFS_DIR(dvp);
767 node = VP_TO_TMPFS_NODE(vp);
768
769 vn_lock(vp, LK_EXCLUSIVE | LK_RETRY);
770
771 /* Check for maximum number of links limit. */
772 if (node->tn_links == LINK_MAX) {
773 error = EMLINK;
774 goto out;
775 }
776 KASSERT(node->tn_links < LINK_MAX);
777
778 /* We cannot create links of files marked immutable or append-only. */
779 if (node->tn_flags & (IMMUTABLE | APPEND)) {
780 error = EPERM;
781 goto out;
782 }
783
784 /* Allocate a new directory entry to represent the inode. */
785 error = tmpfs_alloc_dirent(VFS_TO_TMPFS(vp->v_mount),
786 cnp->cn_nameptr, cnp->cn_namelen, &de);
787 if (error) {
788 goto out;
789 }
790
791 /*
792 * Insert the entry into the directory.
793 * It will increase the inode link count.
794 */
795 tmpfs_dir_attach(dnode, de, node);
796 tmpfs_update(dvp, TMPFS_UPDATE_MTIME | TMPFS_UPDATE_CTIME);
797
798 /* Update the timestamps and trigger the event. */
799 if (node->tn_vnode) {
800 VN_KNOTE(node->tn_vnode, NOTE_LINK);
801 }
802 tmpfs_update(vp, TMPFS_UPDATE_CTIME);
803 error = 0;
804 out:
805 VOP_UNLOCK(vp);
806 vput(dvp);
807 return error;
808 }
809
810 int
811 tmpfs_mkdir(void *v)
812 {
813 struct vop_mkdir_v3_args /* {
814 struct vnode *a_dvp;
815 struct vnode **a_vpp;
816 struct componentname *a_cnp;
817 struct vattr *a_vap;
818 } */ *ap = v;
819 vnode_t *dvp = ap->a_dvp;
820 vnode_t **vpp = ap->a_vpp;
821 struct componentname *cnp = ap->a_cnp;
822 struct vattr *vap = ap->a_vap;
823
824 KASSERT(vap->va_type == VDIR);
825 return tmpfs_construct_node(dvp, vpp, vap, cnp, NULL);
826 }
827
828 int
829 tmpfs_rmdir(void *v)
830 {
831 struct vop_rmdir_args /* {
832 struct vnode *a_dvp;
833 struct vnode *a_vp;
834 struct componentname *a_cnp;
835 } */ *ap = v;
836 vnode_t *dvp = ap->a_dvp;
837 vnode_t *vp = ap->a_vp;
838 tmpfs_mount_t *tmp = VFS_TO_TMPFS(dvp->v_mount);
839 tmpfs_node_t *dnode = VP_TO_TMPFS_DIR(dvp);
840 tmpfs_node_t *node = VP_TO_TMPFS_DIR(vp);
841 tmpfs_dirent_t *de;
842 int error = 0;
843
844 KASSERT(VOP_ISLOCKED(dvp));
845 KASSERT(VOP_ISLOCKED(vp));
846
847 /*
848 * Directories with more than two entries ('.' and '..') cannot be
849 * removed. There may be whiteout entries, which we will destroy.
850 */
851 if (node->tn_size > 0) {
852 /*
853 * If never had whiteout entries, the directory is certainly
854 * not empty. Otherwise, scan for any non-whiteout entry.
855 */
856 if ((node->tn_gen & TMPFS_WHITEOUT_BIT) == 0) {
857 error = ENOTEMPTY;
858 goto out;
859 }
860 TAILQ_FOREACH(de, &node->tn_spec.tn_dir.tn_dir, td_entries) {
861 if (de->td_node != TMPFS_NODE_WHITEOUT) {
862 error = ENOTEMPTY;
863 goto out;
864 }
865 }
866 KASSERT(error == 0);
867 }
868
869 KASSERT(node->tn_spec.tn_dir.tn_parent == dnode);
870
871 /* Lookup the directory entry (check the cached hint first). */
872 de = tmpfs_dir_cached(node);
873 if (de == NULL) {
874 struct componentname *cnp = ap->a_cnp;
875 de = tmpfs_dir_lookup(dnode, cnp);
876 }
877 KASSERT(de && de->td_node == node);
878
879 /* Check flags to see if we are allowed to remove the directory. */
880 if (dnode->tn_flags & APPEND || node->tn_flags & (IMMUTABLE | APPEND)) {
881 error = EPERM;
882 goto out;
883 }
884
885 /* Decrement the link count for the virtual '.' entry. */
886 node->tn_links--;
887
888 /* Detach the directory entry from the directory. */
889 tmpfs_dir_detach(dnode, de);
890
891 /* Purge the cache for parent. */
892 cache_purge(dvp);
893
894 /*
895 * Destroy the directory entry or replace it with a whiteout.
896 *
897 * Note: the inode referred by it will not be destroyed until the
898 * vnode is reclaimed.
899 */
900 if (ap->a_cnp->cn_flags & DOWHITEOUT)
901 tmpfs_dir_attach(dnode, de, TMPFS_NODE_WHITEOUT);
902 else
903 tmpfs_free_dirent(tmp, de);
904
905 /* Destroy the whiteout entries from the node. */
906 while ((de = TAILQ_FIRST(&node->tn_spec.tn_dir.tn_dir)) != NULL) {
907 KASSERT(de->td_node == TMPFS_NODE_WHITEOUT);
908 tmpfs_dir_detach(node, de);
909 tmpfs_free_dirent(tmp, de);
910 }
911 tmpfs_update(dvp, TMPFS_UPDATE_MTIME | TMPFS_UPDATE_CTIME);
912
913 KASSERT(node->tn_size == 0);
914 KASSERT(node->tn_links == 0);
915 out:
916 /* Release the nodes. */
917 vput(dvp);
918 vput(vp);
919 return error;
920 }
921
922 int
923 tmpfs_symlink(void *v)
924 {
925 struct vop_symlink_v3_args /* {
926 struct vnode *a_dvp;
927 struct vnode **a_vpp;
928 struct componentname *a_cnp;
929 struct vattr *a_vap;
930 char *a_target;
931 } */ *ap = v;
932 vnode_t *dvp = ap->a_dvp;
933 vnode_t **vpp = ap->a_vpp;
934 struct componentname *cnp = ap->a_cnp;
935 struct vattr *vap = ap->a_vap;
936 char *target = ap->a_target;
937
938 KASSERT(vap->va_type == VLNK);
939 return tmpfs_construct_node(dvp, vpp, vap, cnp, target);
940 }
941
942 int
943 tmpfs_readdir(void *v)
944 {
945 struct vop_readdir_args /* {
946 struct vnode *a_vp;
947 struct uio *a_uio;
948 kauth_cred_t a_cred;
949 int *a_eofflag;
950 off_t **a_cookies;
951 int *ncookies;
952 } */ *ap = v;
953 vnode_t *vp = ap->a_vp;
954 struct uio *uio = ap->a_uio;
955 int *eofflag = ap->a_eofflag;
956 off_t **cookies = ap->a_cookies;
957 int *ncookies = ap->a_ncookies;
958 off_t startoff, cnt;
959 tmpfs_node_t *node;
960 int error;
961
962 KASSERT(VOP_ISLOCKED(vp));
963
964 /* This operation only makes sense on directory nodes. */
965 if (vp->v_type != VDIR) {
966 return ENOTDIR;
967 }
968 node = VP_TO_TMPFS_DIR(vp);
969 startoff = uio->uio_offset;
970 cnt = 0;
971
972 /*
973 * Retrieve the directory entries, unless it is being destroyed.
974 */
975 if (node->tn_links) {
976 error = tmpfs_dir_getdents(node, uio, &cnt);
977 } else {
978 error = 0;
979 }
980
981 if (eofflag != NULL) {
982 *eofflag = !error && uio->uio_offset == TMPFS_DIRSEQ_EOF;
983 }
984 if (error || cookies == NULL || ncookies == NULL) {
985 return error;
986 }
987
988 /* Update NFS-related variables, if any. */
989 tmpfs_dirent_t *de = NULL;
990 off_t i, off = startoff;
991
992 *cookies = malloc(cnt * sizeof(off_t), M_TEMP, M_WAITOK);
993 *ncookies = cnt;
994
995 for (i = 0; i < cnt; i++) {
996 KASSERT(off != TMPFS_DIRSEQ_EOF);
997 if (off != TMPFS_DIRSEQ_DOT) {
998 if (off == TMPFS_DIRSEQ_DOTDOT) {
999 de = TAILQ_FIRST(&node->tn_spec.tn_dir.tn_dir);
1000 } else if (de != NULL) {
1001 de = TAILQ_NEXT(de, td_entries);
1002 } else {
1003 de = tmpfs_dir_lookupbyseq(node, off);
1004 KASSERT(de != NULL);
1005 de = TAILQ_NEXT(de, td_entries);
1006 }
1007 if (de == NULL) {
1008 off = TMPFS_DIRSEQ_EOF;
1009 } else {
1010 off = tmpfs_dir_getseq(node, de);
1011 }
1012 } else {
1013 off = TMPFS_DIRSEQ_DOTDOT;
1014 }
1015 (*cookies)[i] = off;
1016 }
1017 KASSERT(uio->uio_offset == off);
1018 return error;
1019 }
1020
1021 int
1022 tmpfs_readlink(void *v)
1023 {
1024 struct vop_readlink_args /* {
1025 struct vnode *a_vp;
1026 struct uio *a_uio;
1027 kauth_cred_t a_cred;
1028 } */ *ap = v;
1029 vnode_t *vp = ap->a_vp;
1030 struct uio *uio = ap->a_uio;
1031 tmpfs_node_t *node = VP_TO_TMPFS_NODE(vp);
1032 int error;
1033
1034 KASSERT(VOP_ISLOCKED(vp));
1035 KASSERT(uio->uio_offset == 0);
1036 KASSERT(vp->v_type == VLNK);
1037
1038 /* Note: readlink(2) returns the path without NUL terminator. */
1039 if (node->tn_size > 0) {
1040 error = uiomove(node->tn_spec.tn_lnk.tn_link,
1041 MIN(node->tn_size - 1, uio->uio_resid), uio);
1042 } else {
1043 error = 0;
1044 }
1045 tmpfs_update(vp, TMPFS_UPDATE_ATIME);
1046
1047 return error;
1048 }
1049
1050 int
1051 tmpfs_inactive(void *v)
1052 {
1053 struct vop_inactive_args /* {
1054 struct vnode *a_vp;
1055 bool *a_recycle;
1056 } */ *ap = v;
1057 vnode_t *vp = ap->a_vp;
1058 tmpfs_node_t *node;
1059
1060 KASSERT(VOP_ISLOCKED(vp));
1061
1062 node = VP_TO_TMPFS_NODE(vp);
1063 if (node->tn_links == 0) {
1064 /*
1065 * Mark node as dead by setting its generation to zero.
1066 */
1067 atomic_and_32(&node->tn_gen, ~TMPFS_NODE_GEN_MASK);
1068 *ap->a_recycle = true;
1069 } else {
1070 *ap->a_recycle = false;
1071 }
1072 VOP_UNLOCK(vp);
1073
1074 return 0;
1075 }
1076
1077 int
1078 tmpfs_reclaim(void *v)
1079 {
1080 struct vop_reclaim_args /* {
1081 struct vnode *a_vp;
1082 } */ *ap = v;
1083 vnode_t *vp = ap->a_vp;
1084 tmpfs_mount_t *tmp = VFS_TO_TMPFS(vp->v_mount);
1085 tmpfs_node_t *node = VP_TO_TMPFS_NODE(vp);
1086 bool recycle;
1087
1088 mutex_enter(&node->tn_vlock);
1089
1090 /* Disassociate inode from vnode. */
1091 node->tn_vnode = NULL;
1092 vp->v_data = NULL;
1093
1094 /* If inode is not referenced, i.e. no links, then destroy it. */
1095 recycle = node->tn_links == 0 && TMPFS_NODE_RECLAIMING(node) == 0;
1096
1097 mutex_exit(&node->tn_vlock);
1098
1099 if (recycle) {
1100 tmpfs_free_node(tmp, node);
1101 }
1102 return 0;
1103 }
1104
1105 int
1106 tmpfs_pathconf(void *v)
1107 {
1108 struct vop_pathconf_args /* {
1109 struct vnode *a_vp;
1110 int a_name;
1111 register_t *a_retval;
1112 } */ *ap = v;
1113 const int name = ap->a_name;
1114 register_t *retval = ap->a_retval;
1115 int error = 0;
1116
1117 switch (name) {
1118 case _PC_LINK_MAX:
1119 *retval = LINK_MAX;
1120 break;
1121 case _PC_NAME_MAX:
1122 *retval = TMPFS_MAXNAMLEN;
1123 break;
1124 case _PC_PATH_MAX:
1125 *retval = PATH_MAX;
1126 break;
1127 case _PC_PIPE_BUF:
1128 *retval = PIPE_BUF;
1129 break;
1130 case _PC_CHOWN_RESTRICTED:
1131 *retval = 1;
1132 break;
1133 case _PC_NO_TRUNC:
1134 *retval = 1;
1135 break;
1136 case _PC_SYNC_IO:
1137 *retval = 1;
1138 break;
1139 case _PC_FILESIZEBITS:
1140 *retval = sizeof(off_t) * CHAR_BIT;
1141 break;
1142 default:
1143 error = EINVAL;
1144 }
1145 return error;
1146 }
1147
1148 int
1149 tmpfs_advlock(void *v)
1150 {
1151 struct vop_advlock_args /* {
1152 struct vnode *a_vp;
1153 void * a_id;
1154 int a_op;
1155 struct flock *a_fl;
1156 int a_flags;
1157 } */ *ap = v;
1158 vnode_t *vp = ap->a_vp;
1159 tmpfs_node_t *node = VP_TO_TMPFS_NODE(vp);
1160
1161 return lf_advlock(v, &node->tn_lockf, node->tn_size);
1162 }
1163
1164 int
1165 tmpfs_getpages(void *v)
1166 {
1167 struct vop_getpages_args /* {
1168 struct vnode *a_vp;
1169 voff_t a_offset;
1170 struct vm_page **a_m;
1171 int *a_count;
1172 int a_centeridx;
1173 vm_prot_t a_access_type;
1174 int a_advice;
1175 int a_flags;
1176 } */ * const ap = v;
1177 vnode_t *vp = ap->a_vp;
1178 const voff_t offset = ap->a_offset;
1179 struct vm_page **pgs = ap->a_m;
1180 const int centeridx = ap->a_centeridx;
1181 const vm_prot_t access_type = ap->a_access_type;
1182 const int advice = ap->a_advice;
1183 const int flags = ap->a_flags;
1184 int error, npages = *ap->a_count;
1185 tmpfs_node_t *node;
1186 struct uvm_object *uobj;
1187
1188 KASSERT(vp->v_type == VREG);
1189 KASSERT(mutex_owned(vp->v_interlock));
1190
1191 node = VP_TO_TMPFS_NODE(vp);
1192 uobj = node->tn_spec.tn_reg.tn_aobj;
1193
1194 /*
1195 * Currently, PGO_PASTEOF is not supported.
1196 */
1197 if (vp->v_size <= offset + (centeridx << PAGE_SHIFT)) {
1198 if ((flags & PGO_LOCKED) == 0)
1199 mutex_exit(vp->v_interlock);
1200 return EINVAL;
1201 }
1202
1203 if (vp->v_size < offset + (npages << PAGE_SHIFT)) {
1204 npages = (round_page(vp->v_size) - offset) >> PAGE_SHIFT;
1205 }
1206
1207 if ((flags & PGO_LOCKED) != 0)
1208 return EBUSY;
1209
1210 if ((flags & PGO_NOTIMESTAMP) == 0) {
1211 u_int tflags = 0;
1212
1213 if ((vp->v_mount->mnt_flag & MNT_NOATIME) == 0)
1214 tflags |= TMPFS_UPDATE_ATIME;
1215
1216 if ((access_type & VM_PROT_WRITE) != 0) {
1217 tflags |= TMPFS_UPDATE_MTIME;
1218 if (vp->v_mount->mnt_flag & MNT_RELATIME)
1219 tflags |= TMPFS_UPDATE_ATIME;
1220 }
1221 tmpfs_update(vp, tflags);
1222 }
1223
1224 /*
1225 * Invoke the pager.
1226 *
1227 * Clean the array of pages before. XXX: PR/32166
1228 * Note that vnode lock is shared with underlying UVM object.
1229 */
1230 if (pgs) {
1231 memset(pgs, 0, sizeof(struct vm_pages *) * npages);
1232 }
1233 KASSERT(vp->v_interlock == uobj->vmobjlock);
1234
1235 error = (*uobj->pgops->pgo_get)(uobj, offset, pgs, &npages, centeridx,
1236 access_type, advice, flags | PGO_ALLPAGES);
1237
1238 #if defined(DEBUG)
1239 if (!error && pgs) {
1240 for (int i = 0; i < npages; i++) {
1241 KASSERT(pgs[i] != NULL);
1242 }
1243 }
1244 #endif
1245 return error;
1246 }
1247
1248 int
1249 tmpfs_putpages(void *v)
1250 {
1251 struct vop_putpages_args /* {
1252 struct vnode *a_vp;
1253 voff_t a_offlo;
1254 voff_t a_offhi;
1255 int a_flags;
1256 } */ * const ap = v;
1257 vnode_t *vp = ap->a_vp;
1258 const voff_t offlo = ap->a_offlo;
1259 const voff_t offhi = ap->a_offhi;
1260 const int flags = ap->a_flags;
1261 tmpfs_node_t *node;
1262 struct uvm_object *uobj;
1263 int error;
1264
1265 KASSERT(mutex_owned(vp->v_interlock));
1266
1267 if (vp->v_type != VREG) {
1268 mutex_exit(vp->v_interlock);
1269 return 0;
1270 }
1271
1272 node = VP_TO_TMPFS_NODE(vp);
1273 uobj = node->tn_spec.tn_reg.tn_aobj;
1274
1275 KASSERT(vp->v_interlock == uobj->vmobjlock);
1276 error = (*uobj->pgops->pgo_put)(uobj, offlo, offhi, flags);
1277
1278 /* XXX mtime */
1279
1280 return error;
1281 }
1282
1283 int
1284 tmpfs_whiteout(void *v)
1285 {
1286 struct vop_whiteout_args /* {
1287 struct vnode *a_dvp;
1288 struct componentname *a_cnp;
1289 int a_flags;
1290 } */ *ap = v;
1291 vnode_t *dvp = ap->a_dvp;
1292 struct componentname *cnp = ap->a_cnp;
1293 const int flags = ap->a_flags;
1294 tmpfs_mount_t *tmp = VFS_TO_TMPFS(dvp->v_mount);
1295 tmpfs_node_t *dnode = VP_TO_TMPFS_DIR(dvp);
1296 tmpfs_dirent_t *de;
1297 int error;
1298
1299 switch (flags) {
1300 case LOOKUP:
1301 break;
1302 case CREATE:
1303 error = tmpfs_alloc_dirent(tmp, cnp->cn_nameptr,
1304 cnp->cn_namelen, &de);
1305 if (error)
1306 return error;
1307 tmpfs_dir_attach(dnode, de, TMPFS_NODE_WHITEOUT);
1308 break;
1309 case DELETE:
1310 cnp->cn_flags &= ~DOWHITEOUT; /* when in doubt, cargo cult */
1311 de = tmpfs_dir_lookup(dnode, cnp);
1312 if (de == NULL)
1313 return ENOENT;
1314 tmpfs_dir_detach(dnode, de);
1315 tmpfs_free_dirent(tmp, de);
1316 break;
1317 }
1318 tmpfs_update(dvp, TMPFS_UPDATE_MTIME | TMPFS_UPDATE_CTIME);
1319 return 0;
1320 }
1321
1322 int
1323 tmpfs_print(void *v)
1324 {
1325 struct vop_print_args /* {
1326 struct vnode *a_vp;
1327 } */ *ap = v;
1328 vnode_t *vp = ap->a_vp;
1329 tmpfs_node_t *node = VP_TO_TMPFS_NODE(vp);
1330
1331 printf("tag VT_TMPFS, tmpfs_node %p, flags 0x%x, links %d\n"
1332 "\tmode 0%o, owner %d, group %d, size %" PRIdMAX,
1333 node, node->tn_flags, node->tn_links, node->tn_mode, node->tn_uid,
1334 node->tn_gid, (uintmax_t)node->tn_size);
1335 if (vp->v_type == VFIFO) {
1336 VOCALL(fifo_vnodeop_p, VOFFSET(vop_print), v);
1337 }
1338 printf("\n");
1339 return 0;
1340 }
1341