lfs_vnops.c revision 1.333 1 1.333 christos /* $NetBSD: lfs_vnops.c,v 1.333 2020/05/16 18:31:53 christos Exp $ */
2 1.2 cgd
3 1.22 perseant /*-
4 1.84 perseant * Copyright (c) 1999, 2000, 2001, 2002, 2003 The NetBSD Foundation, Inc.
5 1.22 perseant * All rights reserved.
6 1.22 perseant *
7 1.22 perseant * This code is derived from software contributed to The NetBSD Foundation
8 1.22 perseant * by Konrad E. Schroder <perseant (at) hhhh.org>.
9 1.22 perseant *
10 1.22 perseant * Redistribution and use in source and binary forms, with or without
11 1.22 perseant * modification, are permitted provided that the following conditions
12 1.22 perseant * are met:
13 1.22 perseant * 1. Redistributions of source code must retain the above copyright
14 1.22 perseant * notice, this list of conditions and the following disclaimer.
15 1.22 perseant * 2. Redistributions in binary form must reproduce the above copyright
16 1.22 perseant * notice, this list of conditions and the following disclaimer in the
17 1.22 perseant * documentation and/or other materials provided with the distribution.
18 1.22 perseant *
19 1.22 perseant * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
20 1.22 perseant * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
21 1.22 perseant * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 1.22 perseant * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
23 1.22 perseant * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24 1.22 perseant * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25 1.22 perseant * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26 1.22 perseant * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27 1.22 perseant * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28 1.22 perseant * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29 1.22 perseant * POSSIBILITY OF SUCH DAMAGE.
30 1.22 perseant */
31 1.1 mycroft /*
32 1.15 fvdl * Copyright (c) 1986, 1989, 1991, 1993, 1995
33 1.1 mycroft * The Regents of the University of California. All rights reserved.
34 1.1 mycroft *
35 1.1 mycroft * Redistribution and use in source and binary forms, with or without
36 1.1 mycroft * modification, are permitted provided that the following conditions
37 1.1 mycroft * are met:
38 1.1 mycroft * 1. Redistributions of source code must retain the above copyright
39 1.1 mycroft * notice, this list of conditions and the following disclaimer.
40 1.1 mycroft * 2. Redistributions in binary form must reproduce the above copyright
41 1.1 mycroft * notice, this list of conditions and the following disclaimer in the
42 1.1 mycroft * documentation and/or other materials provided with the distribution.
43 1.114 agc * 3. Neither the name of the University nor the names of its contributors
44 1.1 mycroft * may be used to endorse or promote products derived from this software
45 1.1 mycroft * without specific prior written permission.
46 1.1 mycroft *
47 1.1 mycroft * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
48 1.1 mycroft * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
49 1.1 mycroft * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
50 1.1 mycroft * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
51 1.1 mycroft * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
52 1.1 mycroft * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
53 1.1 mycroft * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
54 1.1 mycroft * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
55 1.1 mycroft * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
56 1.1 mycroft * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
57 1.1 mycroft * SUCH DAMAGE.
58 1.1 mycroft *
59 1.15 fvdl * @(#)lfs_vnops.c 8.13 (Berkeley) 6/10/95
60 1.1 mycroft */
61 1.58 lukem
62 1.302 dholland /* from NetBSD: ufs_vnops.c,v 1.232 2016/05/19 18:32:03 riastradh Exp */
63 1.265 dholland /*-
64 1.265 dholland * Copyright (c) 2008 The NetBSD Foundation, Inc.
65 1.265 dholland * All rights reserved.
66 1.265 dholland *
67 1.265 dholland * This code is derived from software contributed to The NetBSD Foundation
68 1.265 dholland * by Wasabi Systems, Inc.
69 1.265 dholland *
70 1.265 dholland * Redistribution and use in source and binary forms, with or without
71 1.265 dholland * modification, are permitted provided that the following conditions
72 1.265 dholland * are met:
73 1.265 dholland * 1. Redistributions of source code must retain the above copyright
74 1.265 dholland * notice, this list of conditions and the following disclaimer.
75 1.265 dholland * 2. Redistributions in binary form must reproduce the above copyright
76 1.265 dholland * notice, this list of conditions and the following disclaimer in the
77 1.265 dholland * documentation and/or other materials provided with the distribution.
78 1.265 dholland *
79 1.265 dholland * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
80 1.265 dholland * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
81 1.265 dholland * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
82 1.265 dholland * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
83 1.265 dholland * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
84 1.265 dholland * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
85 1.265 dholland * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
86 1.265 dholland * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
87 1.265 dholland * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
88 1.265 dholland * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
89 1.265 dholland * POSSIBILITY OF SUCH DAMAGE.
90 1.265 dholland */
91 1.265 dholland /*
92 1.265 dholland * Copyright (c) 1982, 1986, 1989, 1993, 1995
93 1.265 dholland * The Regents of the University of California. All rights reserved.
94 1.265 dholland * (c) UNIX System Laboratories, Inc.
95 1.265 dholland * All or some portions of this file are derived from material licensed
96 1.265 dholland * to the University of California by American Telephone and Telegraph
97 1.265 dholland * Co. or Unix System Laboratories, Inc. and are reproduced herein with
98 1.265 dholland * the permission of UNIX System Laboratories, Inc.
99 1.265 dholland *
100 1.265 dholland * Redistribution and use in source and binary forms, with or without
101 1.265 dholland * modification, are permitted provided that the following conditions
102 1.265 dholland * are met:
103 1.265 dholland * 1. Redistributions of source code must retain the above copyright
104 1.265 dholland * notice, this list of conditions and the following disclaimer.
105 1.265 dholland * 2. Redistributions in binary form must reproduce the above copyright
106 1.265 dholland * notice, this list of conditions and the following disclaimer in the
107 1.265 dholland * documentation and/or other materials provided with the distribution.
108 1.265 dholland * 3. Neither the name of the University nor the names of its contributors
109 1.265 dholland * may be used to endorse or promote products derived from this software
110 1.265 dholland * without specific prior written permission.
111 1.265 dholland *
112 1.265 dholland * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
113 1.265 dholland * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
114 1.265 dholland * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
115 1.265 dholland * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
116 1.265 dholland * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
117 1.265 dholland * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
118 1.265 dholland * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
119 1.265 dholland * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
120 1.265 dholland * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
121 1.265 dholland * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
122 1.265 dholland * SUCH DAMAGE.
123 1.265 dholland *
124 1.265 dholland * @(#)ufs_vnops.c 8.28 (Berkeley) 7/31/95
125 1.265 dholland */
126 1.265 dholland
127 1.58 lukem #include <sys/cdefs.h>
128 1.333 christos __KERNEL_RCSID(0, "$NetBSD: lfs_vnops.c,v 1.333 2020/05/16 18:31:53 christos Exp $");
129 1.182 martin
130 1.183 martin #ifdef _KERNEL_OPT
131 1.182 martin #include "opt_compat_netbsd.h"
132 1.238 chs #include "opt_uvm_page_trkown.h"
133 1.183 martin #endif
134 1.17 sommerfe
135 1.1 mycroft #include <sys/param.h>
136 1.1 mycroft #include <sys/systm.h>
137 1.1 mycroft #include <sys/namei.h>
138 1.1 mycroft #include <sys/resourcevar.h>
139 1.1 mycroft #include <sys/kernel.h>
140 1.1 mycroft #include <sys/file.h>
141 1.1 mycroft #include <sys/stat.h>
142 1.1 mycroft #include <sys/buf.h>
143 1.1 mycroft #include <sys/proc.h>
144 1.1 mycroft #include <sys/mount.h>
145 1.1 mycroft #include <sys/vnode.h>
146 1.19 thorpej #include <sys/pool.h>
147 1.10 christos #include <sys/signalvar.h>
148 1.176 elad #include <sys/kauth.h>
149 1.179 perseant #include <sys/syslog.h>
150 1.1 mycroft
151 1.12 mycroft #include <miscfs/fifofs/fifo.h>
152 1.12 mycroft #include <miscfs/genfs/genfs.h>
153 1.1 mycroft #include <miscfs/specfs/specdev.h>
154 1.1 mycroft
155 1.244 dholland #include <ufs/lfs/ulfs_inode.h>
156 1.244 dholland #include <ufs/lfs/ulfsmount.h>
157 1.244 dholland #include <ufs/lfs/ulfs_bswap.h>
158 1.244 dholland #include <ufs/lfs/ulfs_extern.h>
159 1.1 mycroft
160 1.84 perseant #include <uvm/uvm.h>
161 1.95 perseant #include <uvm/uvm_pmap.h>
162 1.95 perseant #include <uvm/uvm_stat.h>
163 1.95 perseant #include <uvm/uvm_pager.h>
164 1.84 perseant
165 1.1 mycroft #include <ufs/lfs/lfs.h>
166 1.278 dholland #include <ufs/lfs/lfs_accessors.h>
167 1.252 dholland #include <ufs/lfs/lfs_kernel.h>
168 1.1 mycroft #include <ufs/lfs/lfs_extern.h>
169 1.1 mycroft
/*
 * Condition variable defined outside this file.  Within this file it is
 * only signalled: lfs_fsync() and lfs_set_dirop() call cv_broadcast() on
 * it while holding lfs_lock.
 */
170 1.310 maya extern kcondvar_t lfs_writerd_cv;
/*
 * When nonzero (the initial value), lfs_fsync() returns immediately for
 * FSYNC_LAZY requests instead of queueing the inode on fs->lfs_pchainhd.
 */
171 1.203 perseant int lfs_ignore_lazy_sync = 1;
172 1.203 perseant
/*
 * Forward declarations of the static extended-attribute handlers that
 * are referenced by the vnode operation tables below.
 */
173 1.254 dholland static int lfs_openextattr(void *v);
174 1.254 dholland static int lfs_closeextattr(void *v);
175 1.254 dholland static int lfs_getextattr(void *v);
176 1.254 dholland static int lfs_setextattr(void *v);
177 1.254 dholland static int lfs_listextattr(void *v);
178 1.254 dholland static int lfs_deleteextattr(void *v);
179 1.254 dholland
/* Forward declaration; the definition follows the operation tables. */
180 1.300 dholland static int lfs_makeinode(struct vattr *vap, struct vnode *,
181 1.299 dholland const struct ulfs_lookup_results *,
182 1.299 dholland struct vnode **, struct componentname *);
183 1.299 dholland
184 1.1 mycroft /* Global vfs data structures for lfs. */
/*
 * Vnode operations vector for lfs_vnodeop_p.  Each entry pairs a vop
 * descriptor with its handler, and the list ends with a { NULL, NULL }
 * sentinel.  The handlers are a mix of lfs_*, ulfs_* and genfs_*
 * routines; fallocate and fdiscard are wired to genfs_eopnotsupp.
 * lfs_vnodeop_opv_desc, at the end of this block, pairs the table with
 * the lfs_vnodeop_p pointer.
 * NOTE(review): presumably this is the vector used for regular files and
 * directories, with the spec and fifo vectors covering device nodes and
 * FIFOs -- confirm against the code that selects the vector.
 */
185 1.51 perseant int (**lfs_vnodeop_p)(void *);
186 1.50 jdolecek const struct vnodeopv_entry_desc lfs_vnodeop_entries[] = {
187 1.1 mycroft { &vop_default_desc, vn_default_error },
188 1.245 dholland { &vop_lookup_desc, ulfs_lookup }, /* lookup */
189 1.22 perseant { &vop_create_desc, lfs_create }, /* create */
190 1.245 dholland { &vop_whiteout_desc, ulfs_whiteout }, /* whiteout */
191 1.22 perseant { &vop_mknod_desc, lfs_mknod }, /* mknod */
192 1.245 dholland { &vop_open_desc, ulfs_open }, /* open */
193 1.1 mycroft { &vop_close_desc, lfs_close }, /* close */
194 1.245 dholland { &vop_access_desc, ulfs_access }, /* access */
195 1.333 christos { &vop_accessx_desc, genfs_accessx }, /* accessx */
196 1.1 mycroft { &vop_getattr_desc, lfs_getattr }, /* getattr */
197 1.61 perseant { &vop_setattr_desc, lfs_setattr }, /* setattr */
198 1.1 mycroft { &vop_read_desc, lfs_read }, /* read */
199 1.1 mycroft { &vop_write_desc, lfs_write }, /* write */
200 1.269 dholland { &vop_fallocate_desc, genfs_eopnotsupp }, /* fallocate */
201 1.269 dholland { &vop_fdiscard_desc, genfs_eopnotsupp }, /* fdiscard */
202 1.245 dholland { &vop_ioctl_desc, ulfs_ioctl }, /* ioctl */
203 1.90 perseant { &vop_fcntl_desc, lfs_fcntl }, /* fcntl */
204 1.245 dholland { &vop_poll_desc, ulfs_poll }, /* poll */
205 1.68 jdolecek { &vop_kqfilter_desc, genfs_kqfilter }, /* kqfilter */
206 1.245 dholland { &vop_revoke_desc, ulfs_revoke }, /* revoke */
207 1.84 perseant { &vop_mmap_desc, lfs_mmap }, /* mmap */
208 1.1 mycroft { &vop_fsync_desc, lfs_fsync }, /* fsync */
209 1.245 dholland { &vop_seek_desc, ulfs_seek }, /* seek */
210 1.22 perseant { &vop_remove_desc, lfs_remove }, /* remove */
211 1.22 perseant { &vop_link_desc, lfs_link }, /* link */
212 1.22 perseant { &vop_rename_desc, lfs_rename }, /* rename */
213 1.22 perseant { &vop_mkdir_desc, lfs_mkdir }, /* mkdir */
214 1.22 perseant { &vop_rmdir_desc, lfs_rmdir }, /* rmdir */
215 1.22 perseant { &vop_symlink_desc, lfs_symlink }, /* symlink */
216 1.245 dholland { &vop_readdir_desc, ulfs_readdir }, /* readdir */
217 1.245 dholland { &vop_readlink_desc, ulfs_readlink }, /* readlink */
218 1.245 dholland { &vop_abortop_desc, ulfs_abortop }, /* abortop */
219 1.40 perseant { &vop_inactive_desc, lfs_inactive }, /* inactive */
220 1.1 mycroft { &vop_reclaim_desc, lfs_reclaim }, /* reclaim */
221 1.245 dholland { &vop_lock_desc, ulfs_lock }, /* lock */
222 1.245 dholland { &vop_unlock_desc, ulfs_unlock }, /* unlock */
223 1.245 dholland { &vop_bmap_desc, ulfs_bmap }, /* bmap */
224 1.94 perseant { &vop_strategy_desc, lfs_strategy }, /* strategy */
225 1.245 dholland { &vop_print_desc, ulfs_print }, /* print */
226 1.245 dholland { &vop_islocked_desc, ulfs_islocked }, /* islocked */
227 1.245 dholland { &vop_pathconf_desc, ulfs_pathconf }, /* pathconf */
228 1.245 dholland { &vop_advlock_desc, ulfs_advlock }, /* advlock */
229 1.1 mycroft { &vop_bwrite_desc, lfs_bwrite }, /* bwrite */
230 1.60 chs { &vop_getpages_desc, lfs_getpages }, /* getpages */
231 1.60 chs { &vop_putpages_desc, lfs_putpages }, /* putpages */
232 1.254 dholland { &vop_openextattr_desc, lfs_openextattr }, /* openextattr */
233 1.254 dholland { &vop_closeextattr_desc, lfs_closeextattr }, /* closeextattr */
234 1.254 dholland { &vop_getextattr_desc, lfs_getextattr }, /* getextattr */
235 1.254 dholland { &vop_setextattr_desc, lfs_setextattr }, /* setextattr */
236 1.254 dholland { &vop_listextattr_desc, lfs_listextattr }, /* listextattr */
237 1.254 dholland { &vop_deleteextattr_desc, lfs_deleteextattr }, /* deleteextattr */
238 1.53 chs { NULL, NULL }
239 1.1 mycroft };
240 1.50 jdolecek const struct vnodeopv_desc lfs_vnodeop_opv_desc =
241 1.1 mycroft { &lfs_vnodeop_p, lfs_vnodeop_entries };
242 1.1 mycroft
/*
 * Vnode operations vector for lfs_specop_p.  Most operations go to the
 * spec_* handlers.  The exceptions visible in the table are: close
 * (lfsspec_close), access/accessx, getattr/setattr, read/write
 * (ulfsspec_*), fcntl, inactive/reclaim, lock/unlock, print, islocked
 * and the extattr operations, which use LFS/ULFS/genfs handlers, and
 * bwrite, which uses vn_bwrite.  The list ends with a { NULL, NULL }
 * sentinel; lfs_specop_opv_desc pairs the table with lfs_specop_p.
 */
243 1.51 perseant int (**lfs_specop_p)(void *);
244 1.50 jdolecek const struct vnodeopv_entry_desc lfs_specop_entries[] = {
245 1.1 mycroft { &vop_default_desc, vn_default_error },
246 1.1 mycroft { &vop_lookup_desc, spec_lookup }, /* lookup */
247 1.1 mycroft { &vop_create_desc, spec_create }, /* create */
248 1.1 mycroft { &vop_mknod_desc, spec_mknod }, /* mknod */
249 1.1 mycroft { &vop_open_desc, spec_open }, /* open */
250 1.65 perseant { &vop_close_desc, lfsspec_close }, /* close */
251 1.245 dholland { &vop_access_desc, ulfs_access }, /* access */
252 1.333 christos { &vop_accessx_desc, genfs_accessx }, /* accessx */
253 1.1 mycroft { &vop_getattr_desc, lfs_getattr }, /* getattr */
254 1.61 perseant { &vop_setattr_desc, lfs_setattr }, /* setattr */
255 1.245 dholland { &vop_read_desc, ulfsspec_read }, /* read */
256 1.245 dholland { &vop_write_desc, ulfsspec_write }, /* write */
257 1.269 dholland { &vop_fallocate_desc, spec_fallocate }, /* fallocate */
258 1.269 dholland { &vop_fdiscard_desc, spec_fdiscard }, /* fdiscard */
259 1.1 mycroft { &vop_ioctl_desc, spec_ioctl }, /* ioctl */
260 1.245 dholland { &vop_fcntl_desc, ulfs_fcntl }, /* fcntl */
261 1.13 mycroft { &vop_poll_desc, spec_poll }, /* poll */
262 1.68 jdolecek { &vop_kqfilter_desc, spec_kqfilter }, /* kqfilter */
263 1.15 fvdl { &vop_revoke_desc, spec_revoke }, /* revoke */
264 1.1 mycroft { &vop_mmap_desc, spec_mmap }, /* mmap */
265 1.1 mycroft { &vop_fsync_desc, spec_fsync }, /* fsync */
266 1.1 mycroft { &vop_seek_desc, spec_seek }, /* seek */
267 1.1 mycroft { &vop_remove_desc, spec_remove }, /* remove */
268 1.1 mycroft { &vop_link_desc, spec_link }, /* link */
269 1.1 mycroft { &vop_rename_desc, spec_rename }, /* rename */
270 1.1 mycroft { &vop_mkdir_desc, spec_mkdir }, /* mkdir */
271 1.1 mycroft { &vop_rmdir_desc, spec_rmdir }, /* rmdir */
272 1.1 mycroft { &vop_symlink_desc, spec_symlink }, /* symlink */
273 1.1 mycroft { &vop_readdir_desc, spec_readdir }, /* readdir */
274 1.1 mycroft { &vop_readlink_desc, spec_readlink }, /* readlink */
275 1.1 mycroft { &vop_abortop_desc, spec_abortop }, /* abortop */
276 1.40 perseant { &vop_inactive_desc, lfs_inactive }, /* inactive */
277 1.1 mycroft { &vop_reclaim_desc, lfs_reclaim }, /* reclaim */
278 1.245 dholland { &vop_lock_desc, ulfs_lock }, /* lock */
279 1.245 dholland { &vop_unlock_desc, ulfs_unlock }, /* unlock */
280 1.1 mycroft { &vop_bmap_desc, spec_bmap }, /* bmap */
281 1.1 mycroft { &vop_strategy_desc, spec_strategy }, /* strategy */
282 1.245 dholland { &vop_print_desc, ulfs_print }, /* print */
283 1.245 dholland { &vop_islocked_desc, ulfs_islocked }, /* islocked */
284 1.1 mycroft { &vop_pathconf_desc, spec_pathconf }, /* pathconf */
285 1.1 mycroft { &vop_advlock_desc, spec_advlock }, /* advlock */
286 1.28 perseant { &vop_bwrite_desc, vn_bwrite }, /* bwrite */
287 1.53 chs { &vop_getpages_desc, spec_getpages }, /* getpages */
288 1.53 chs { &vop_putpages_desc, spec_putpages }, /* putpages */
289 1.254 dholland { &vop_openextattr_desc, lfs_openextattr }, /* openextattr */
290 1.254 dholland { &vop_closeextattr_desc, lfs_closeextattr }, /* closeextattr */
291 1.254 dholland { &vop_getextattr_desc, lfs_getextattr }, /* getextattr */
292 1.254 dholland { &vop_setextattr_desc, lfs_setextattr }, /* setextattr */
293 1.254 dholland { &vop_listextattr_desc, lfs_listextattr }, /* listextattr */
294 1.254 dholland { &vop_deleteextattr_desc, lfs_deleteextattr }, /* deleteextattr */
295 1.53 chs { NULL, NULL }
296 1.1 mycroft };
297 1.50 jdolecek const struct vnodeopv_desc lfs_specop_opv_desc =
298 1.1 mycroft { &lfs_specop_p, lfs_specop_entries };
299 1.1 mycroft
/*
 * Vnode operations vector for lfs_fifoop_p.  Most operations are routed
 * to vn_fifo_bypass.  The exceptions visible in the table are: close
 * (lfsfifo_close), access/accessx, getattr/setattr, read/write
 * (ulfsfifo_*), fcntl, inactive/reclaim, lock/unlock, print, islocked,
 * bwrite (lfs_bwrite) and the extattr operations.  Unlike the vnodeop
 * and specop tables, this one lists no getpages entry.  The list ends
 * with a { NULL, NULL } sentinel; lfs_fifoop_opv_desc pairs the table
 * with lfs_fifoop_p.
 */
300 1.51 perseant int (**lfs_fifoop_p)(void *);
301 1.50 jdolecek const struct vnodeopv_entry_desc lfs_fifoop_entries[] = {
302 1.1 mycroft { &vop_default_desc, vn_default_error },
303 1.227 pooka { &vop_lookup_desc, vn_fifo_bypass }, /* lookup */
304 1.227 pooka { &vop_create_desc, vn_fifo_bypass }, /* create */
305 1.227 pooka { &vop_mknod_desc, vn_fifo_bypass }, /* mknod */
306 1.227 pooka { &vop_open_desc, vn_fifo_bypass }, /* open */
307 1.65 perseant { &vop_close_desc, lfsfifo_close }, /* close */
308 1.245 dholland { &vop_access_desc, ulfs_access }, /* access */
309 1.333 christos { &vop_accessx_desc, genfs_accessx }, /* accessx */
310 1.1 mycroft { &vop_getattr_desc, lfs_getattr }, /* getattr */
311 1.61 perseant { &vop_setattr_desc, lfs_setattr }, /* setattr */
312 1.245 dholland { &vop_read_desc, ulfsfifo_read }, /* read */
313 1.245 dholland { &vop_write_desc, ulfsfifo_write }, /* write */
314 1.269 dholland { &vop_fallocate_desc, vn_fifo_bypass }, /* fallocate */
315 1.269 dholland { &vop_fdiscard_desc, vn_fifo_bypass }, /* fdiscard */
316 1.227 pooka { &vop_ioctl_desc, vn_fifo_bypass }, /* ioctl */
317 1.245 dholland { &vop_fcntl_desc, ulfs_fcntl }, /* fcntl */
318 1.227 pooka { &vop_poll_desc, vn_fifo_bypass }, /* poll */
319 1.227 pooka { &vop_kqfilter_desc, vn_fifo_bypass }, /* kqfilter */
320 1.227 pooka { &vop_revoke_desc, vn_fifo_bypass }, /* revoke */
321 1.227 pooka { &vop_mmap_desc, vn_fifo_bypass }, /* mmap */
322 1.227 pooka { &vop_fsync_desc, vn_fifo_bypass }, /* fsync */
323 1.227 pooka { &vop_seek_desc, vn_fifo_bypass }, /* seek */
324 1.227 pooka { &vop_remove_desc, vn_fifo_bypass }, /* remove */
325 1.227 pooka { &vop_link_desc, vn_fifo_bypass }, /* link */
326 1.227 pooka { &vop_rename_desc, vn_fifo_bypass }, /* rename */
327 1.227 pooka { &vop_mkdir_desc, vn_fifo_bypass }, /* mkdir */
328 1.227 pooka { &vop_rmdir_desc, vn_fifo_bypass }, /* rmdir */
329 1.227 pooka { &vop_symlink_desc, vn_fifo_bypass }, /* symlink */
330 1.227 pooka { &vop_readdir_desc, vn_fifo_bypass }, /* readdir */
331 1.227 pooka { &vop_readlink_desc, vn_fifo_bypass }, /* readlink */
332 1.227 pooka { &vop_abortop_desc, vn_fifo_bypass }, /* abortop */
333 1.40 perseant { &vop_inactive_desc, lfs_inactive }, /* inactive */
334 1.1 mycroft { &vop_reclaim_desc, lfs_reclaim }, /* reclaim */
335 1.245 dholland { &vop_lock_desc, ulfs_lock }, /* lock */
336 1.245 dholland { &vop_unlock_desc, ulfs_unlock }, /* unlock */
337 1.227 pooka { &vop_bmap_desc, vn_fifo_bypass }, /* bmap */
338 1.227 pooka { &vop_strategy_desc, vn_fifo_bypass }, /* strategy */
339 1.245 dholland { &vop_print_desc, ulfs_print }, /* print */
340 1.245 dholland { &vop_islocked_desc, ulfs_islocked }, /* islocked */
341 1.227 pooka { &vop_pathconf_desc, vn_fifo_bypass }, /* pathconf */
342 1.227 pooka { &vop_advlock_desc, vn_fifo_bypass }, /* advlock */
343 1.1 mycroft { &vop_bwrite_desc, lfs_bwrite }, /* bwrite */
344 1.227 pooka { &vop_putpages_desc, vn_fifo_bypass }, /* putpages */
345 1.254 dholland { &vop_openextattr_desc, lfs_openextattr }, /* openextattr */
346 1.254 dholland { &vop_closeextattr_desc, lfs_closeextattr }, /* closeextattr */
347 1.254 dholland { &vop_getextattr_desc, lfs_getextattr }, /* getextattr */
348 1.254 dholland { &vop_setextattr_desc, lfs_setextattr }, /* setextattr */
349 1.254 dholland { &vop_listextattr_desc, lfs_listextattr }, /* listextattr */
350 1.254 dholland { &vop_deleteextattr_desc, lfs_deleteextattr }, /* deleteextattr */
351 1.53 chs { NULL, NULL }
352 1.1 mycroft };
353 1.50 jdolecek const struct vnodeopv_desc lfs_fifoop_opv_desc =
354 1.1 mycroft { &lfs_fifoop_p, lfs_fifoop_entries };
355 1.1 mycroft
356 1.244 dholland #include <ufs/lfs/ulfs_readwrite.c>
357 1.1 mycroft
358 1.1 mycroft /*
359 1.299 dholland * Allocate a new inode.
360 1.299 dholland */
361 1.299 dholland static int
362 1.300 dholland lfs_makeinode(struct vattr *vap, struct vnode *dvp,
363 1.299 dholland const struct ulfs_lookup_results *ulr,
364 1.299 dholland struct vnode **vpp, struct componentname *cnp)
365 1.299 dholland {
366 1.299 dholland struct inode *ip;
367 1.299 dholland struct vnode *tvp;
368 1.299 dholland int error;
369 1.299 dholland
370 1.323 hannken error = vcache_new(dvp->v_mount, dvp, vap, cnp->cn_cred, NULL, &tvp);
371 1.299 dholland if (error)
372 1.299 dholland return error;
373 1.299 dholland error = vn_lock(tvp, LK_EXCLUSIVE);
374 1.299 dholland if (error) {
375 1.299 dholland vrele(tvp);
376 1.299 dholland return error;
377 1.299 dholland }
378 1.319 maya MARK_VNODE(tvp);
379 1.299 dholland *vpp = tvp;
380 1.299 dholland ip = VTOI(tvp);
381 1.317 maya ip->i_state |= IN_ACCESS | IN_CHANGE | IN_UPDATE;
382 1.299 dholland ip->i_nlink = 1;
383 1.299 dholland DIP_ASSIGN(ip, nlink, 1);
384 1.299 dholland
385 1.299 dholland /* Authorize setting SGID if needed. */
386 1.299 dholland if (ip->i_mode & ISGID) {
387 1.333 christos error = kauth_authorize_vnode(cnp->cn_cred,
388 1.333 christos KAUTH_VNODE_WRITE_SECURITY,
389 1.333 christos tvp, NULL, genfs_can_chmod(tvp, cnp->cn_cred, ip->i_uid,
390 1.299 dholland ip->i_gid, MAKEIMODE(vap->va_type, vap->va_mode)));
391 1.299 dholland if (error) {
392 1.299 dholland ip->i_mode &= ~ISGID;
393 1.299 dholland DIP_ASSIGN(ip, mode, ip->i_mode);
394 1.299 dholland }
395 1.299 dholland }
396 1.299 dholland
397 1.299 dholland if (cnp->cn_flags & ISWHITEOUT) {
398 1.299 dholland ip->i_flags |= UF_OPAQUE;
399 1.299 dholland DIP_ASSIGN(ip, flags, ip->i_flags);
400 1.299 dholland }
401 1.299 dholland
402 1.299 dholland /*
403 1.299 dholland * Make sure inode goes to disk before directory entry.
404 1.299 dholland */
405 1.299 dholland if ((error = lfs_update(tvp, NULL, NULL, UPDATE_DIROP)) != 0)
406 1.299 dholland goto bad;
407 1.299 dholland error = ulfs_direnter(dvp, ulr, tvp,
408 1.299 dholland cnp, ip->i_number, LFS_IFTODT(ip->i_mode), NULL);
409 1.299 dholland if (error)
410 1.299 dholland goto bad;
411 1.299 dholland *vpp = tvp;
412 1.325 christos cache_enter(dvp, *vpp, cnp->cn_nameptr, cnp->cn_namelen, cnp->cn_flags);
413 1.311 riastrad KASSERT(VOP_ISLOCKED(*vpp) == LK_EXCLUSIVE);
414 1.299 dholland return (0);
415 1.299 dholland
416 1.299 dholland bad:
417 1.299 dholland /*
418 1.299 dholland * Write error occurred trying to update the inode
419 1.299 dholland * or the directory so must deallocate the inode.
420 1.299 dholland */
421 1.299 dholland ip->i_nlink = 0;
422 1.299 dholland DIP_ASSIGN(ip, nlink, 0);
423 1.317 maya ip->i_state |= IN_CHANGE;
424 1.299 dholland /* If IN_ADIROP, account for it */
425 1.319 maya UNMARK_VNODE(tvp);
426 1.299 dholland vput(tvp);
427 1.299 dholland return (error);
428 1.299 dholland }
429 1.299 dholland
430 1.299 dholland /*
431 1.1 mycroft * Synch an open file.
432 1.1 mycroft */
433 1.1 mycroft /* ARGSUSED */
434 1.10 christos int
435 1.51 perseant lfs_fsync(void *v)
436 1.10 christos {
437 1.1 mycroft struct vop_fsync_args /* {
438 1.1 mycroft struct vnode *a_vp;
439 1.176 elad kauth_cred_t a_cred;
440 1.22 perseant int a_flags;
441 1.49 toshii off_t offlo;
442 1.49 toshii off_t offhi;
443 1.10 christos } */ *ap = v;
444 1.60 chs struct vnode *vp = ap->a_vp;
445 1.311 riastrad int wait;
446 1.203 perseant struct inode *ip = VTOI(vp);
447 1.203 perseant struct lfs *fs = ip->i_lfs;
448 1.311 riastrad int error = 0;
449 1.311 riastrad
450 1.311 riastrad KASSERT(VOP_ISLOCKED(vp) == LK_EXCLUSIVE);
451 1.84 perseant
452 1.161 perseant /* If we're mounted read-only, don't try to sync. */
453 1.203 perseant if (fs->lfs_ronly)
454 1.311 riastrad goto out;
455 1.161 perseant
456 1.231 hannken /* If a removed vnode is being cleaned, no need to sync here. */
457 1.231 hannken if ((ap->a_flags & FSYNC_RECLAIM) != 0 && ip->i_mode == 0)
458 1.311 riastrad goto out;
459 1.231 hannken
460 1.86 perseant /*
461 1.203 perseant * Trickle sync simply adds this vnode to the pager list, as if
462 1.203 perseant * the pagedaemon had requested a pageout.
463 1.86 perseant */
464 1.84 perseant if (ap->a_flags & FSYNC_LAZY) {
465 1.203 perseant if (lfs_ignore_lazy_sync == 0) {
466 1.214 ad mutex_enter(&lfs_lock);
467 1.317 maya if (!(ip->i_state & IN_PAGING)) {
468 1.317 maya ip->i_state |= IN_PAGING;
469 1.203 perseant TAILQ_INSERT_TAIL(&fs->lfs_pchainhd, ip,
470 1.203 perseant i_lfs_pchain);
471 1.203 perseant }
472 1.310 maya cv_broadcast(&lfs_writerd_cv);
473 1.214 ad mutex_exit(&lfs_lock);
474 1.203 perseant }
475 1.311 riastrad goto out;
476 1.84 perseant }
477 1.47 perseant
478 1.175 perseant /*
479 1.321 maya * If a vnode is being cleaned, flush it out before we try to
480 1.188 perseant * reuse it. This prevents the cleaner from writing files twice
481 1.188 perseant * in the same partial segment, causing an accounting underflow.
482 1.188 perseant */
483 1.317 maya if (ap->a_flags & FSYNC_RECLAIM && ip->i_state & IN_CLEANING) {
484 1.188 perseant lfs_vflush(vp);
485 1.175 perseant }
486 1.175 perseant
487 1.84 perseant wait = (ap->a_flags & FSYNC_WAIT);
488 1.203 perseant do {
489 1.331 ad rw_enter(vp->v_uobj.vmobjlock, RW_WRITER);
490 1.203 perseant error = VOP_PUTPAGES(vp, trunc_page(ap->a_offlo),
491 1.203 perseant round_page(ap->a_offhi),
492 1.203 perseant PGO_CLEANIT | (wait ? PGO_SYNCIO : 0));
493 1.205 perseant if (error == EAGAIN) {
494 1.214 ad mutex_enter(&lfs_lock);
495 1.274 dholland mtsleep(&fs->lfs_availsleep, PCATCH | PUSER,
496 1.274 dholland "lfs_fsync", hz / 100 + 1, &lfs_lock);
497 1.214 ad mutex_exit(&lfs_lock);
498 1.205 perseant }
499 1.203 perseant } while (error == EAGAIN);
500 1.103 perseant if (error)
501 1.311 riastrad goto out;
502 1.203 perseant
503 1.203 perseant if ((ap->a_flags & FSYNC_DATAONLY) == 0)
504 1.203 perseant error = lfs_update(vp, NULL, NULL, wait ? UPDATE_WAIT : 0);
505 1.203 perseant
506 1.133 wrstuden if (error == 0 && ap->a_flags & FSYNC_CACHE) {
507 1.133 wrstuden int l = 0;
508 1.203 perseant error = VOP_IOCTL(ip->i_devvp, DIOCCACHESYNC, &l, FWRITE,
509 1.213 pooka curlwp->l_cred);
510 1.133 wrstuden }
511 1.103 perseant if (wait && !VPISEMPTY(vp))
512 1.203 perseant LFS_SET_UINO(ip, IN_MODIFIED);
513 1.84 perseant
514 1.311 riastrad out:
515 1.311 riastrad KASSERT(VOP_ISLOCKED(vp) == LK_EXCLUSIVE);
516 1.63 perseant return error;
517 1.1 mycroft }
518 1.1 mycroft
519 1.1 mycroft /*
520 1.245 dholland * Take IN_ADIROP off, then call ulfs_inactive.
521 1.40 perseant */
522 1.40 perseant int
523 1.51 perseant lfs_inactive(void *v)
524 1.40 perseant {
525 1.313 riastrad struct vop_inactive_v2_args /* {
526 1.40 perseant struct vnode *a_vp;
527 1.313 riastrad bool *a_recycle;
528 1.40 perseant } */ *ap = v;
529 1.72 yamt
530 1.311 riastrad KASSERT(VOP_ISLOCKED(ap->a_vp) == LK_EXCLUSIVE);
531 1.311 riastrad
532 1.319 maya UNMARK_VNODE(ap->a_vp);
533 1.76 yamt
534 1.97 perseant /*
535 1.97 perseant * The Ifile is only ever inactivated on unmount.
536 1.97 perseant * Streamline this process by not giving it more dirty blocks.
537 1.97 perseant */
538 1.97 perseant if (VTOI(ap->a_vp)->i_number == LFS_IFILE_INUM) {
539 1.214 ad mutex_enter(&lfs_lock);
540 1.97 perseant LFS_CLR_UINO(VTOI(ap->a_vp), IN_ALLMOD);
541 1.214 ad mutex_exit(&lfs_lock);
542 1.97 perseant return 0;
543 1.97 perseant }
544 1.97 perseant
545 1.239 perseant #ifdef DEBUG
546 1.239 perseant /*
547 1.239 perseant * This might happen on unmount.
548 1.239 perseant * XXX If it happens at any other time, it should be a panic.
549 1.239 perseant */
550 1.239 perseant if (ap->a_vp->v_uflag & VU_DIROP) {
551 1.239 perseant struct inode *ip = VTOI(ap->a_vp);
552 1.306 maya printf("lfs_inactive: inactivating VU_DIROP? ino = %llu\n",
553 1.306 maya (unsigned long long) ip->i_number);
554 1.239 perseant }
555 1.239 perseant #endif /* DIAGNOSTIC */
556 1.239 perseant
557 1.245 dholland return ulfs_inactive(v);
558 1.40 perseant }
559 1.40 perseant
560 1.249 dholland int
561 1.138 perseant lfs_set_dirop(struct vnode *dvp, struct vnode *vp)
562 1.40 perseant {
563 1.24 perseant struct lfs *fs;
564 1.24 perseant int error;
565 1.24 perseant
566 1.311 riastrad KASSERT(VOP_ISLOCKED(dvp) == LK_EXCLUSIVE);
567 1.311 riastrad KASSERT(vp == NULL || VOP_ISLOCKED(vp) == LK_EXCLUSIVE);
568 1.71 yamt
569 1.138 perseant fs = VTOI(dvp)->i_lfs;
570 1.141 perseant
571 1.141 perseant ASSERT_NO_SEGLOCK(fs);
572 1.44 perseant /*
573 1.134 perseant * LFS_NRESERVE calculates direct and indirect blocks as well
574 1.134 perseant * as an inode block; an overestimate in most cases.
575 1.44 perseant */
576 1.138 perseant if ((error = lfs_reserve(fs, dvp, vp, LFS_NRESERVE(fs))) != 0)
577 1.44 perseant return (error);
578 1.70 yamt
579 1.214 ad restart:
580 1.214 ad mutex_enter(&lfs_lock);
581 1.141 perseant if (fs->lfs_dirops == 0) {
582 1.214 ad mutex_exit(&lfs_lock);
583 1.138 perseant lfs_check(dvp, LFS_UNUSED_LBN, 0);
584 1.214 ad mutex_enter(&lfs_lock);
585 1.113 yamt }
586 1.190 perseant while (fs->lfs_writer) {
587 1.309 maya error = cv_wait_sig(&fs->lfs_diropscv, &lfs_lock);
588 1.190 perseant if (error == EINTR) {
589 1.214 ad mutex_exit(&lfs_lock);
590 1.190 perseant goto unreserve;
591 1.190 perseant }
592 1.190 perseant }
593 1.113 yamt if (lfs_dirvcount > LFS_MAX_DIROP && fs->lfs_dirops == 0) {
594 1.310 maya cv_broadcast(&lfs_writerd_cv);
595 1.214 ad mutex_exit(&lfs_lock);
596 1.198 ad preempt();
597 1.113 yamt goto restart;
598 1.113 yamt }
599 1.33 perseant
600 1.113 yamt if (lfs_dirvcount > LFS_MAX_DIROP) {
601 1.136 perseant DLOG((DLOG_DIROP, "lfs_set_dirop: sleeping with dirops=%d, "
602 1.136 perseant "dirvcount=%d\n", fs->lfs_dirops, lfs_dirvcount));
603 1.214 ad if ((error = mtsleep(&lfs_dirvcount,
604 1.214 ad PCATCH | PUSER | PNORELOCK, "lfs_maxdirop", 0,
605 1.214 ad &lfs_lock)) != 0) {
606 1.304 maya mutex_exit(&lfs_lock);
607 1.113 yamt goto unreserve;
608 1.113 yamt }
609 1.304 maya mutex_exit(&lfs_lock);
610 1.113 yamt goto restart;
611 1.135 perry }
612 1.113 yamt
613 1.135 perry ++fs->lfs_dirops;
614 1.239 perseant /* fs->lfs_doifile = 1; */ /* XXX why? --ks */
615 1.214 ad mutex_exit(&lfs_lock);
616 1.24 perseant
617 1.46 perseant /* Hold a reference so SET_ENDOP will be happy */
618 1.138 perseant vref(dvp);
619 1.138 perseant if (vp) {
620 1.138 perseant vref(vp);
621 1.138 perseant MARK_VNODE(vp);
622 1.138 perseant }
623 1.46 perseant
624 1.138 perseant MARK_VNODE(dvp);
625 1.24 perseant return 0;
626 1.70 yamt
627 1.203 perseant unreserve:
628 1.138 perseant lfs_reserve(fs, dvp, vp, -LFS_NRESERVE(fs));
629 1.70 yamt return error;
630 1.1 mycroft }
631 1.1 mycroft
632 1.138 perseant /*
633 1.264 dholland * Opposite of lfs_set_dirop... mostly. For now at least must call
634 1.264 dholland * UNMARK_VNODE(dvp) explicitly first. (XXX: clean that up)
635 1.138 perseant */
636 1.264 dholland void
637 1.264 dholland lfs_unset_dirop(struct lfs *fs, struct vnode *dvp, const char *str)
638 1.138 perseant {
639 1.264 dholland mutex_enter(&lfs_lock);
640 1.264 dholland --fs->lfs_dirops;
641 1.264 dholland if (!fs->lfs_dirops) {
642 1.264 dholland if (fs->lfs_nadirop) {
643 1.264 dholland panic("lfs_unset_dirop: %s: no dirops but "
644 1.264 dholland " nadirop=%d", str,
645 1.264 dholland fs->lfs_nadirop);
646 1.264 dholland }
647 1.264 dholland wakeup(&fs->lfs_writer);
648 1.264 dholland mutex_exit(&lfs_lock);
649 1.264 dholland lfs_check(dvp, LFS_UNUSED_LBN, 0);
650 1.264 dholland } else {
651 1.264 dholland mutex_exit(&lfs_lock);
652 1.138 perseant }
653 1.264 dholland lfs_reserve(fs, dvp, NULL, -LFS_NRESERVE(fs));
654 1.1 mycroft }
655 1.1 mycroft
656 1.117 yamt void
657 1.117 yamt lfs_mark_vnode(struct vnode *vp)
658 1.117 yamt {
659 1.117 yamt struct inode *ip = VTOI(vp);
660 1.117 yamt struct lfs *fs = ip->i_lfs;
661 1.37 perseant
662 1.214 ad mutex_enter(&lfs_lock);
663 1.317 maya if (!(ip->i_state & IN_ADIROP)) {
664 1.212 ad if (!(vp->v_uflag & VU_DIROP)) {
665 1.240 perseant mutex_exit(&lfs_lock);
666 1.272 hannken vref(vp);
667 1.240 perseant mutex_enter(&lfs_lock);
668 1.117 yamt ++lfs_dirvcount;
669 1.173 perseant ++fs->lfs_dirvcount;
670 1.117 yamt TAILQ_INSERT_TAIL(&fs->lfs_dchainhd, ip, i_lfs_dchain);
671 1.212 ad vp->v_uflag |= VU_DIROP;
672 1.117 yamt }
673 1.117 yamt ++fs->lfs_nadirop;
674 1.317 maya ip->i_state &= ~IN_CDIROP;
675 1.317 maya ip->i_state |= IN_ADIROP;
676 1.117 yamt } else
677 1.212 ad KASSERT(vp->v_uflag & VU_DIROP);
678 1.214 ad mutex_exit(&lfs_lock);
679 1.117 yamt }
680 1.40 perseant
681 1.117 yamt void
682 1.117 yamt lfs_unmark_vnode(struct vnode *vp)
683 1.40 perseant {
684 1.117 yamt struct inode *ip = VTOI(vp);
685 1.40 perseant
686 1.240 perseant mutex_enter(&lfs_lock);
687 1.317 maya if (ip && (ip->i_state & IN_ADIROP)) {
688 1.212 ad KASSERT(vp->v_uflag & VU_DIROP);
689 1.40 perseant --ip->i_lfs->lfs_nadirop;
690 1.317 maya ip->i_state &= ~IN_ADIROP;
691 1.117 yamt }
692 1.240 perseant mutex_exit(&lfs_lock);
693 1.40 perseant }
694 1.15 fvdl
695 1.1 mycroft int
696 1.51 perseant lfs_symlink(void *v)
697 1.10 christos {
698 1.261 hannken struct vop_symlink_v3_args /* {
699 1.1 mycroft struct vnode *a_dvp;
700 1.1 mycroft struct vnode **a_vpp;
701 1.1 mycroft struct componentname *a_cnp;
702 1.1 mycroft struct vattr *a_vap;
703 1.1 mycroft char *a_target;
704 1.10 christos } */ *ap = v;
705 1.264 dholland struct lfs *fs;
706 1.264 dholland struct vnode *dvp, **vpp;
707 1.266 dholland struct inode *ip;
708 1.266 dholland struct ulfs_lookup_results *ulr;
709 1.266 dholland ssize_t len; /* XXX should be size_t */
710 1.37 perseant int error;
711 1.1 mycroft
712 1.264 dholland dvp = ap->a_dvp;
713 1.264 dholland vpp = ap->a_vpp;
714 1.264 dholland
715 1.311 riastrad KASSERT(VOP_ISLOCKED(dvp) == LK_EXCLUSIVE);
716 1.264 dholland KASSERT(vpp != NULL);
717 1.264 dholland KASSERT(*vpp == NULL);
718 1.272 hannken KASSERT(ap->a_vap->va_type == VLNK);
719 1.264 dholland
720 1.266 dholland /* XXX should handle this material another way */
721 1.266 dholland ulr = &VTOI(ap->a_dvp)->i_crap;
722 1.266 dholland ULFS_CHECK_CRAPCOUNTER(VTOI(ap->a_dvp));
723 1.266 dholland
724 1.264 dholland fs = VFSTOULFS(dvp->v_mount)->um_lfs;
725 1.264 dholland ASSERT_NO_SEGLOCK(fs);
726 1.264 dholland if (fs->lfs_ronly) {
727 1.264 dholland return EROFS;
728 1.264 dholland }
729 1.264 dholland
730 1.264 dholland error = lfs_set_dirop(dvp, NULL);
731 1.272 hannken if (error)
732 1.37 perseant return error;
733 1.264 dholland
734 1.300 dholland error = lfs_makeinode(ap->a_vap, dvp, ulr, vpp, ap->a_cnp);
735 1.266 dholland if (error) {
736 1.266 dholland goto out;
737 1.266 dholland }
738 1.311 riastrad KASSERT(VOP_ISLOCKED(*vpp) == LK_EXCLUSIVE);
739 1.266 dholland
740 1.266 dholland VN_KNOTE(ap->a_dvp, NOTE_WRITE);
741 1.266 dholland ip = VTOI(*vpp);
742 1.266 dholland
743 1.294 dholland /*
744 1.294 dholland * This test is off by one. um_maxsymlinklen contains the
745 1.294 dholland * number of bytes available, and we aren't storing a \0, so
746 1.294 dholland * the test should properly be <=. However, it cannot be
747 1.294 dholland * changed as this would break compatibility with existing fs
748 1.294 dholland * images -- see the way ulfs_readlink() works.
749 1.294 dholland */
750 1.266 dholland len = strlen(ap->a_target);
751 1.266 dholland if (len < ip->i_lfs->um_maxsymlinklen) {
752 1.266 dholland memcpy((char *)SHORTLINK(ip), ap->a_target, len);
753 1.266 dholland ip->i_size = len;
754 1.266 dholland DIP_ASSIGN(ip, size, len);
755 1.266 dholland uvm_vnp_setsize(*vpp, ip->i_size);
756 1.317 maya ip->i_state |= IN_CHANGE | IN_UPDATE;
757 1.266 dholland if ((*vpp)->v_mount->mnt_flag & MNT_RELATIME)
758 1.317 maya ip->i_state |= IN_ACCESS;
759 1.266 dholland } else {
760 1.270 riastrad error = ulfs_bufio(UIO_WRITE, *vpp, ap->a_target, len, (off_t)0,
761 1.270 riastrad IO_NODELOCKED | IO_JOURNALLOCKED, ap->a_cnp->cn_cred, NULL,
762 1.270 riastrad NULL);
763 1.266 dholland }
764 1.266 dholland
765 1.266 dholland VOP_UNLOCK(*vpp);
766 1.266 dholland if (error)
767 1.266 dholland vrele(*vpp);
768 1.266 dholland
769 1.266 dholland out:
770 1.264 dholland UNMARK_VNODE(dvp);
771 1.264 dholland /* XXX: is it even possible for the symlink to get MARK'd? */
772 1.264 dholland UNMARK_VNODE(*vpp);
773 1.281 dholland if (error) {
774 1.264 dholland *vpp = NULL;
775 1.264 dholland }
776 1.264 dholland lfs_unset_dirop(fs, dvp, "symlink");
777 1.264 dholland
778 1.264 dholland vrele(dvp);
779 1.37 perseant return (error);
780 1.1 mycroft }
781 1.1 mycroft
782 1.1 mycroft int
783 1.51 perseant lfs_mknod(void *v)
784 1.10 christos {
785 1.261 hannken struct vop_mknod_v3_args /* {
786 1.1 mycroft struct vnode *a_dvp;
787 1.1 mycroft struct vnode **a_vpp;
788 1.1 mycroft struct componentname *a_cnp;
789 1.1 mycroft struct vattr *a_vap;
790 1.203 perseant } */ *ap = v;
791 1.264 dholland struct lfs *fs;
792 1.264 dholland struct vnode *dvp, **vpp;
793 1.250 dholland struct vattr *vap;
794 1.86 perseant struct inode *ip;
795 1.86 perseant int error;
796 1.52 assar ino_t ino;
797 1.245 dholland struct ulfs_lookup_results *ulr;
798 1.237 dholland
799 1.264 dholland dvp = ap->a_dvp;
800 1.264 dholland vpp = ap->a_vpp;
801 1.250 dholland vap = ap->a_vap;
802 1.250 dholland
803 1.311 riastrad KASSERT(VOP_ISLOCKED(dvp) == LK_EXCLUSIVE);
804 1.264 dholland KASSERT(vpp != NULL);
805 1.264 dholland KASSERT(*vpp == NULL);
806 1.311 riastrad
807 1.237 dholland /* XXX should handle this material another way */
808 1.264 dholland ulr = &VTOI(dvp)->i_crap;
809 1.264 dholland ULFS_CHECK_CRAPCOUNTER(VTOI(dvp));
810 1.264 dholland
811 1.264 dholland fs = VFSTOULFS(dvp->v_mount)->um_lfs;
812 1.264 dholland ASSERT_NO_SEGLOCK(fs);
813 1.264 dholland if (fs->lfs_ronly) {
814 1.264 dholland return EROFS;
815 1.264 dholland }
816 1.264 dholland
817 1.264 dholland error = lfs_set_dirop(dvp, NULL);
818 1.272 hannken if (error)
819 1.28 perseant return error;
820 1.250 dholland
821 1.300 dholland error = lfs_makeinode(vap, dvp, ulr, vpp, ap->a_cnp);
822 1.28 perseant
823 1.28 perseant /* Either way we're done with the dirop at this point */
824 1.264 dholland UNMARK_VNODE(dvp);
825 1.264 dholland UNMARK_VNODE(*vpp);
826 1.264 dholland lfs_unset_dirop(fs, dvp, "mknod");
827 1.28 perseant
828 1.250 dholland if (error) {
829 1.303 dholland vrele(dvp);
830 1.250 dholland *vpp = NULL;
831 1.28 perseant return (error);
832 1.250 dholland }
833 1.311 riastrad KASSERT(VOP_ISLOCKED(*vpp) == LK_EXCLUSIVE);
834 1.28 perseant
835 1.264 dholland VN_KNOTE(dvp, NOTE_WRITE);
836 1.86 perseant ip = VTOI(*vpp);
837 1.52 assar ino = ip->i_number;
838 1.317 maya ip->i_state |= IN_ACCESS | IN_CHANGE | IN_UPDATE;
839 1.134 perseant
840 1.28 perseant /*
841 1.28 perseant * Call fsync to write the vnode so that we don't have to deal with
842 1.262 hannken * flushing it when it's marked VU_DIROP or reclaiming.
843 1.28 perseant *
844 1.28 perseant * XXX KS - If we can't flush we also can't call vgone(), so must
845 1.28 perseant * return. But, that leaves this vnode in limbo, also not good.
846 1.28 perseant * Can this ever happen (barring hardware failure)?
847 1.28 perseant */
848 1.213 pooka if ((error = VOP_FSYNC(*vpp, NOCRED, FSYNC_WAIT, 0, 0)) != 0) {
849 1.306 maya panic("lfs_mknod: couldn't fsync (ino %llu)",
850 1.306 maya (unsigned long long) ino);
851 1.136 perseant /* return (error); */
852 1.40 perseant }
853 1.134 perseant
854 1.303 dholland vrele(dvp);
855 1.273 hannken KASSERT(error == 0);
856 1.261 hannken VOP_UNLOCK(*vpp);
857 1.86 perseant return (0);
858 1.1 mycroft }
859 1.1 mycroft
860 1.265 dholland /*
861 1.265 dholland * Create a regular file
862 1.265 dholland */
863 1.265 dholland int
864 1.51 perseant lfs_create(void *v)
865 1.10 christos {
866 1.261 hannken struct vop_create_v3_args /* {
867 1.1 mycroft struct vnode *a_dvp;
868 1.1 mycroft struct vnode **a_vpp;
869 1.1 mycroft struct componentname *a_cnp;
870 1.1 mycroft struct vattr *a_vap;
871 1.10 christos } */ *ap = v;
872 1.264 dholland struct lfs *fs;
873 1.264 dholland struct vnode *dvp, **vpp;
874 1.268 dholland struct vattr *vap;
875 1.268 dholland struct ulfs_lookup_results *ulr;
876 1.37 perseant int error;
877 1.1 mycroft
878 1.264 dholland dvp = ap->a_dvp;
879 1.264 dholland vpp = ap->a_vpp;
880 1.268 dholland vap = ap->a_vap;
881 1.264 dholland
882 1.311 riastrad KASSERT(VOP_ISLOCKED(dvp) == LK_EXCLUSIVE);
883 1.264 dholland KASSERT(vpp != NULL);
884 1.264 dholland KASSERT(*vpp == NULL);
885 1.264 dholland
886 1.268 dholland /* XXX should handle this material another way */
887 1.268 dholland ulr = &VTOI(dvp)->i_crap;
888 1.268 dholland ULFS_CHECK_CRAPCOUNTER(VTOI(dvp));
889 1.268 dholland
890 1.264 dholland fs = VFSTOULFS(dvp->v_mount)->um_lfs;
891 1.264 dholland ASSERT_NO_SEGLOCK(fs);
892 1.264 dholland if (fs->lfs_ronly) {
893 1.264 dholland return EROFS;
894 1.264 dholland }
895 1.264 dholland
896 1.264 dholland error = lfs_set_dirop(dvp, NULL);
897 1.272 hannken if (error)
898 1.37 perseant return error;
899 1.264 dholland
900 1.300 dholland error = lfs_makeinode(vap, dvp, ulr, vpp, ap->a_cnp);
901 1.268 dholland if (error) {
902 1.268 dholland goto out;
903 1.268 dholland }
904 1.311 riastrad KASSERT(VOP_ISLOCKED(*vpp) == LK_EXCLUSIVE);
905 1.268 dholland VN_KNOTE(dvp, NOTE_WRITE);
906 1.268 dholland VOP_UNLOCK(*vpp);
907 1.268 dholland
908 1.268 dholland out:
909 1.264 dholland
910 1.264 dholland UNMARK_VNODE(dvp);
911 1.264 dholland UNMARK_VNODE(*vpp);
912 1.281 dholland if (error) {
913 1.264 dholland *vpp = NULL;
914 1.264 dholland }
915 1.264 dholland lfs_unset_dirop(fs, dvp, "create");
916 1.264 dholland
917 1.264 dholland vrele(dvp);
918 1.37 perseant return (error);
919 1.22 perseant }
920 1.22 perseant
921 1.22 perseant int
922 1.267 dholland lfs_mkdir(void *v)
923 1.265 dholland {
924 1.267 dholland struct vop_mkdir_v3_args /* {
925 1.267 dholland struct vnode *a_dvp;
926 1.267 dholland struct vnode **a_vpp;
927 1.267 dholland struct componentname *a_cnp;
928 1.267 dholland struct vattr *a_vap;
929 1.265 dholland } */ *ap = v;
930 1.267 dholland struct lfs *fs;
931 1.267 dholland struct vnode *dvp, *tvp, **vpp;
932 1.267 dholland struct inode *dp, *ip;
933 1.267 dholland struct componentname *cnp;
934 1.267 dholland struct vattr *vap;
935 1.265 dholland struct ulfs_lookup_results *ulr;
936 1.267 dholland struct buf *bp;
937 1.293 dholland LFS_DIRHEADER *dirp;
938 1.267 dholland int dirblksiz;
939 1.267 dholland int error;
940 1.265 dholland
941 1.267 dholland dvp = ap->a_dvp;
942 1.267 dholland tvp = NULL;
943 1.267 dholland vpp = ap->a_vpp;
944 1.267 dholland cnp = ap->a_cnp;
945 1.267 dholland vap = ap->a_vap;
946 1.267 dholland
947 1.311 riastrad KASSERT(VOP_ISLOCKED(dvp) == LK_EXCLUSIVE);
948 1.311 riastrad
949 1.267 dholland dp = VTOI(dvp);
950 1.267 dholland ip = NULL;
951 1.267 dholland
952 1.272 hannken KASSERT(vap->va_type == VDIR);
953 1.267 dholland KASSERT(vpp != NULL);
954 1.267 dholland KASSERT(*vpp == NULL);
955 1.265 dholland
956 1.265 dholland /* XXX should handle this material another way */
957 1.265 dholland ulr = &dp->i_crap;
958 1.265 dholland ULFS_CHECK_CRAPCOUNTER(dp);
959 1.265 dholland
960 1.267 dholland fs = VFSTOULFS(dvp->v_mount)->um_lfs;
961 1.267 dholland ASSERT_NO_SEGLOCK(fs);
962 1.267 dholland if (fs->lfs_ronly) {
963 1.267 dholland return EROFS;
964 1.267 dholland }
965 1.322 zafer
966 1.322 zafer if ((nlink_t)dp->i_nlink >= LINK_MAX) {
967 1.322 zafer return EMLINK;
968 1.322 zafer }
969 1.322 zafer
970 1.267 dholland dirblksiz = fs->um_dirblksiz;
971 1.291 dholland /* XXX dholland 20150911 I believe this to be true, but... */
972 1.291 dholland //KASSERT(dirblksiz == LFS_DIRBLKSIZ);
973 1.267 dholland
974 1.267 dholland error = lfs_set_dirop(dvp, NULL);
975 1.272 hannken if (error)
976 1.267 dholland return error;
977 1.267 dholland
978 1.265 dholland /*
979 1.300 dholland * Must simulate part of lfs_makeinode here to acquire the inode,
980 1.265 dholland * but not have it entered in the parent directory. The entry is
981 1.265 dholland * made later after writing "." and ".." entries.
982 1.265 dholland */
983 1.323 hannken error = vcache_new(dvp->v_mount, dvp, vap, cnp->cn_cred, NULL,
984 1.323 hannken ap->a_vpp);
985 1.272 hannken if (error)
986 1.272 hannken goto out;
987 1.272 hannken
988 1.272 hannken error = vn_lock(*ap->a_vpp, LK_EXCLUSIVE);
989 1.272 hannken if (error) {
990 1.272 hannken vrele(*ap->a_vpp);
991 1.272 hannken *ap->a_vpp = NULL;
992 1.265 dholland goto out;
993 1.272 hannken }
994 1.265 dholland
995 1.272 hannken tvp = *ap->a_vpp;
996 1.319 maya MARK_VNODE(tvp);
997 1.265 dholland ip = VTOI(tvp);
998 1.317 maya ip->i_state |= IN_ACCESS | IN_CHANGE | IN_UPDATE;
999 1.265 dholland ip->i_nlink = 2;
1000 1.265 dholland DIP_ASSIGN(ip, nlink, 2);
1001 1.265 dholland if (cnp->cn_flags & ISWHITEOUT) {
1002 1.265 dholland ip->i_flags |= UF_OPAQUE;
1003 1.265 dholland DIP_ASSIGN(ip, flags, ip->i_flags);
1004 1.265 dholland }
1005 1.265 dholland
1006 1.265 dholland /*
1007 1.265 dholland * Bump link count in parent directory to reflect work done below.
1008 1.265 dholland */
1009 1.265 dholland dp->i_nlink++;
1010 1.265 dholland DIP_ASSIGN(dp, nlink, dp->i_nlink);
1011 1.317 maya dp->i_state |= IN_CHANGE;
1012 1.265 dholland if ((error = lfs_update(dvp, NULL, NULL, UPDATE_DIROP)) != 0)
1013 1.265 dholland goto bad;
1014 1.265 dholland
1015 1.265 dholland /*
1016 1.291 dholland * Initialize directory with "." and "..". This used to use a
1017 1.291 dholland * static template but that adds moving parts for very little
1018 1.291 dholland * benefit.
1019 1.265 dholland */
1020 1.265 dholland if ((error = lfs_balloc(tvp, (off_t)0, dirblksiz, cnp->cn_cred,
1021 1.265 dholland B_CLRBUF, &bp)) != 0)
1022 1.265 dholland goto bad;
1023 1.265 dholland ip->i_size = dirblksiz;
1024 1.265 dholland DIP_ASSIGN(ip, size, dirblksiz);
1025 1.317 maya ip->i_state |= IN_ACCESS | IN_CHANGE | IN_UPDATE;
1026 1.265 dholland uvm_vnp_setsize(tvp, ip->i_size);
1027 1.291 dholland dirp = bp->b_data;
1028 1.291 dholland
1029 1.291 dholland /* . */
1030 1.291 dholland lfs_dir_setino(fs, dirp, ip->i_number);
1031 1.292 dholland lfs_dir_setreclen(fs, dirp, LFS_DIRECTSIZ(fs, 1));
1032 1.291 dholland lfs_dir_settype(fs, dirp, LFS_DT_DIR);
1033 1.291 dholland lfs_dir_setnamlen(fs, dirp, 1);
1034 1.291 dholland lfs_copydirname(fs, lfs_dir_nameptr(fs, dirp), ".", 1,
1035 1.292 dholland LFS_DIRECTSIZ(fs, 1));
1036 1.291 dholland dirp = LFS_NEXTDIR(fs, dirp);
1037 1.291 dholland /* .. */
1038 1.291 dholland lfs_dir_setino(fs, dirp, dp->i_number);
1039 1.292 dholland lfs_dir_setreclen(fs, dirp, dirblksiz - LFS_DIRECTSIZ(fs, 1));
1040 1.291 dholland lfs_dir_settype(fs, dirp, LFS_DT_DIR);
1041 1.291 dholland lfs_dir_setnamlen(fs, dirp, 2);
1042 1.291 dholland lfs_copydirname(fs, lfs_dir_nameptr(fs, dirp), "..", 2,
1043 1.292 dholland dirblksiz - LFS_DIRECTSIZ(fs, 1));
1044 1.265 dholland
1045 1.265 dholland /*
1046 1.267 dholland * Directory set up; now install its entry in the parent directory.
1047 1.265 dholland */
1048 1.265 dholland if ((error = VOP_BWRITE(bp->b_vp, bp)) != 0)
1049 1.265 dholland goto bad;
1050 1.265 dholland if ((error = lfs_update(tvp, NULL, NULL, UPDATE_DIROP)) != 0) {
1051 1.265 dholland goto bad;
1052 1.265 dholland }
1053 1.290 dholland error = ulfs_direnter(dvp, ulr, tvp,
1054 1.290 dholland cnp, ip->i_number, LFS_IFTODT(ip->i_mode), bp);
1055 1.265 dholland bad:
1056 1.265 dholland if (error == 0) {
1057 1.265 dholland VN_KNOTE(dvp, NOTE_WRITE | NOTE_LINK);
1058 1.265 dholland VOP_UNLOCK(tvp);
1059 1.265 dholland } else {
1060 1.265 dholland dp->i_nlink--;
1061 1.265 dholland DIP_ASSIGN(dp, nlink, dp->i_nlink);
1062 1.317 maya dp->i_state |= IN_CHANGE;
1063 1.265 dholland /*
1064 1.265 dholland * No need to do an explicit lfs_truncate here, vrele will
1065 1.265 dholland * do this for us because we set the link count to 0.
1066 1.265 dholland */
1067 1.265 dholland ip->i_nlink = 0;
1068 1.265 dholland DIP_ASSIGN(ip, nlink, 0);
1069 1.317 maya ip->i_state |= IN_CHANGE;
1070 1.265 dholland /* If IN_ADIROP, account for it */
1071 1.319 maya UNMARK_VNODE(tvp);
1072 1.265 dholland vput(tvp);
1073 1.265 dholland }
1074 1.267 dholland
1075 1.267 dholland out:
1076 1.264 dholland UNMARK_VNODE(dvp);
1077 1.264 dholland UNMARK_VNODE(*vpp);
1078 1.281 dholland if (error) {
1079 1.264 dholland *vpp = NULL;
1080 1.264 dholland }
1081 1.264 dholland lfs_unset_dirop(fs, dvp, "mkdir");
1082 1.264 dholland
1083 1.264 dholland vrele(dvp);
1084 1.37 perseant return (error);
1085 1.1 mycroft }
1086 1.1 mycroft
1087 1.1 mycroft int
1088 1.51 perseant lfs_remove(void *v)
1089 1.10 christos {
1090 1.314 riastrad struct vop_remove_v2_args /* {
1091 1.1 mycroft struct vnode *a_dvp;
1092 1.1 mycroft struct vnode *a_vp;
1093 1.1 mycroft struct componentname *a_cnp;
1094 1.10 christos } */ *ap = v;
1095 1.34 perseant struct vnode *dvp, *vp;
1096 1.188 perseant struct inode *ip;
1097 1.37 perseant int error;
1098 1.34 perseant
1099 1.34 perseant dvp = ap->a_dvp;
1100 1.34 perseant vp = ap->a_vp;
1101 1.311 riastrad
1102 1.311 riastrad KASSERT(VOP_ISLOCKED(dvp) == LK_EXCLUSIVE);
1103 1.311 riastrad KASSERT(VOP_ISLOCKED(vp) == LK_EXCLUSIVE);
1104 1.311 riastrad
1105 1.188 perseant ip = VTOI(vp);
1106 1.264 dholland if ((error = lfs_set_dirop(dvp, vp)) != 0) {
1107 1.34 perseant if (dvp == vp)
1108 1.34 perseant vrele(vp);
1109 1.34 perseant else
1110 1.34 perseant vput(vp);
1111 1.37 perseant return error;
1112 1.34 perseant }
1113 1.245 dholland error = ulfs_remove(ap);
1114 1.188 perseant if (ip->i_nlink == 0)
1115 1.188 perseant lfs_orphan(ip->i_lfs, ip->i_number);
1116 1.264 dholland
1117 1.264 dholland UNMARK_VNODE(dvp);
1118 1.264 dholland if (ap->a_vp) {
1119 1.264 dholland UNMARK_VNODE(ap->a_vp);
1120 1.264 dholland }
1121 1.264 dholland lfs_unset_dirop(ip->i_lfs, dvp, "remove");
1122 1.264 dholland vrele(dvp);
1123 1.264 dholland if (ap->a_vp) {
1124 1.264 dholland vrele(ap->a_vp);
1125 1.264 dholland }
1126 1.264 dholland
1127 1.37 perseant return (error);
1128 1.1 mycroft }
1129 1.1 mycroft
1130 1.1 mycroft int
1131 1.51 perseant lfs_rmdir(void *v)
1132 1.10 christos {
1133 1.314 riastrad struct vop_rmdir_v2_args /* {
1134 1.1 mycroft struct vnodeop_desc *a_desc;
1135 1.1 mycroft struct vnode *a_dvp;
1136 1.1 mycroft struct vnode *a_vp;
1137 1.1 mycroft struct componentname *a_cnp;
1138 1.10 christos } */ *ap = v;
1139 1.84 perseant struct vnode *vp;
1140 1.188 perseant struct inode *ip;
1141 1.37 perseant int error;
1142 1.1 mycroft
1143 1.84 perseant vp = ap->a_vp;
1144 1.311 riastrad
1145 1.311 riastrad KASSERT(VOP_ISLOCKED(ap->a_dvp) == LK_EXCLUSIVE);
1146 1.311 riastrad KASSERT(VOP_ISLOCKED(vp) == LK_EXCLUSIVE);
1147 1.311 riastrad
1148 1.188 perseant ip = VTOI(vp);
1149 1.264 dholland if ((error = lfs_set_dirop(ap->a_dvp, ap->a_vp)) != 0) {
1150 1.194 chs if (ap->a_dvp == vp)
1151 1.314 riastrad vrele(vp);
1152 1.194 chs else
1153 1.314 riastrad vput(vp);
1154 1.37 perseant return error;
1155 1.34 perseant }
1156 1.245 dholland error = ulfs_rmdir(ap);
1157 1.188 perseant if (ip->i_nlink == 0)
1158 1.188 perseant lfs_orphan(ip->i_lfs, ip->i_number);
1159 1.264 dholland
1160 1.264 dholland UNMARK_VNODE(ap->a_dvp);
1161 1.264 dholland if (ap->a_vp) {
1162 1.264 dholland UNMARK_VNODE(ap->a_vp);
1163 1.264 dholland }
1164 1.264 dholland lfs_unset_dirop(ip->i_lfs, ap->a_dvp, "rmdir");
1165 1.264 dholland vrele(ap->a_dvp);
1166 1.264 dholland if (ap->a_vp) {
1167 1.264 dholland vrele(ap->a_vp);
1168 1.264 dholland }
1169 1.264 dholland
1170 1.37 perseant return (error);
1171 1.1 mycroft }
1172 1.1 mycroft
1173 1.1 mycroft int
1174 1.51 perseant lfs_link(void *v)
1175 1.10 christos {
1176 1.271 riastrad struct vop_link_v2_args /* {
1177 1.9 mycroft struct vnode *a_dvp;
1178 1.1 mycroft struct vnode *a_vp;
1179 1.1 mycroft struct componentname *a_cnp;
1180 1.10 christos } */ *ap = v;
1181 1.264 dholland struct lfs *fs;
1182 1.265 dholland struct vnode *dvp;
1183 1.37 perseant int error;
1184 1.1 mycroft
1185 1.264 dholland dvp = ap->a_dvp;
1186 1.264 dholland
1187 1.311 riastrad KASSERT(VOP_ISLOCKED(dvp) == LK_EXCLUSIVE);
1188 1.311 riastrad
1189 1.264 dholland fs = VFSTOULFS(dvp->v_mount)->um_lfs;
1190 1.264 dholland ASSERT_NO_SEGLOCK(fs);
1191 1.264 dholland if (fs->lfs_ronly) {
1192 1.264 dholland return EROFS;
1193 1.264 dholland }
1194 1.264 dholland
1195 1.264 dholland error = lfs_set_dirop(dvp, NULL);
1196 1.264 dholland if (error) {
1197 1.37 perseant return error;
1198 1.34 perseant }
1199 1.264 dholland
1200 1.245 dholland error = ulfs_link(ap);
1201 1.264 dholland
1202 1.264 dholland UNMARK_VNODE(dvp);
1203 1.264 dholland lfs_unset_dirop(fs, dvp, "link");
1204 1.264 dholland vrele(dvp);
1205 1.264 dholland
1206 1.37 perseant return (error);
1207 1.1 mycroft }
1208 1.22 perseant
1209 1.1 mycroft /* XXX hack to avoid calling ITIMES in getattr */
1210 1.1 mycroft int
1211 1.51 perseant lfs_getattr(void *v)
1212 1.10 christos {
1213 1.1 mycroft struct vop_getattr_args /* {
1214 1.1 mycroft struct vnode *a_vp;
1215 1.1 mycroft struct vattr *a_vap;
1216 1.176 elad kauth_cred_t a_cred;
1217 1.10 christos } */ *ap = v;
1218 1.35 augustss struct vnode *vp = ap->a_vp;
1219 1.311 riastrad struct inode *ip;
1220 1.35 augustss struct vattr *vap = ap->a_vap;
1221 1.311 riastrad struct lfs *fs;
1222 1.311 riastrad
1223 1.311 riastrad KASSERT(VOP_ISLOCKED(vp));
1224 1.311 riastrad
1225 1.311 riastrad ip = VTOI(vp);
1226 1.311 riastrad fs = ip->i_lfs;
1227 1.251 dholland
1228 1.1 mycroft /*
1229 1.1 mycroft * Copy from inode table
1230 1.1 mycroft */
1231 1.1 mycroft vap->va_fsid = ip->i_dev;
1232 1.1 mycroft vap->va_fileid = ip->i_number;
1233 1.246 dholland vap->va_mode = ip->i_mode & ~LFS_IFMT;
1234 1.102 fvdl vap->va_nlink = ip->i_nlink;
1235 1.102 fvdl vap->va_uid = ip->i_uid;
1236 1.102 fvdl vap->va_gid = ip->i_gid;
1237 1.288 dholland switch (vp->v_type) {
1238 1.288 dholland case VBLK:
1239 1.288 dholland case VCHR:
1240 1.288 dholland vap->va_rdev = (dev_t)lfs_dino_getrdev(fs, ip->i_din);
1241 1.288 dholland break;
1242 1.288 dholland default:
1243 1.288 dholland vap->va_rdev = NODEV;
1244 1.288 dholland break;
1245 1.288 dholland }
1246 1.55 chs vap->va_size = vp->v_size;
1247 1.288 dholland vap->va_atime.tv_sec = lfs_dino_getatime(fs, ip->i_din);
1248 1.288 dholland vap->va_atime.tv_nsec = lfs_dino_getatimensec(fs, ip->i_din);
1249 1.288 dholland vap->va_mtime.tv_sec = lfs_dino_getmtime(fs, ip->i_din);
1250 1.288 dholland vap->va_mtime.tv_nsec = lfs_dino_getmtimensec(fs, ip->i_din);
1251 1.288 dholland vap->va_ctime.tv_sec = lfs_dino_getctime(fs, ip->i_din);
1252 1.288 dholland vap->va_ctime.tv_nsec = lfs_dino_getctimensec(fs, ip->i_din);
1253 1.102 fvdl vap->va_flags = ip->i_flags;
1254 1.102 fvdl vap->va_gen = ip->i_gen;
1255 1.1 mycroft /* this doesn't belong here */
1256 1.1 mycroft if (vp->v_type == VBLK)
1257 1.1 mycroft vap->va_blocksize = BLKDEV_IOSIZE;
1258 1.1 mycroft else if (vp->v_type == VCHR)
1259 1.1 mycroft vap->va_blocksize = MAXBSIZE;
1260 1.1 mycroft else
1261 1.1 mycroft vap->va_blocksize = vp->v_mount->mnt_stat.f_iosize;
1262 1.279 dholland vap->va_bytes = lfs_fsbtob(fs, ip->i_lfs_effnblks);
1263 1.1 mycroft vap->va_type = vp->v_type;
1264 1.1 mycroft vap->va_filerev = ip->i_modrev;
1265 1.1 mycroft return (0);
1266 1.61 perseant }
1267 1.61 perseant
1268 1.61 perseant /*
1269 1.61 perseant * Check to make sure the inode blocks won't choke the buffer
1270 1.245 dholland * cache, then call ulfs_setattr as usual.
1271 1.61 perseant */
1272 1.61 perseant int
1273 1.61 perseant lfs_setattr(void *v)
1274 1.61 perseant {
1275 1.149 skrll struct vop_setattr_args /* {
1276 1.61 perseant struct vnode *a_vp;
1277 1.61 perseant struct vattr *a_vap;
1278 1.176 elad kauth_cred_t a_cred;
1279 1.61 perseant } */ *ap = v;
1280 1.61 perseant struct vnode *vp = ap->a_vp;
1281 1.61 perseant
1282 1.311 riastrad KASSERT(VOP_ISLOCKED(vp) == LK_EXCLUSIVE);
1283 1.61 perseant lfs_check(vp, LFS_UNUSED_LBN, 0);
1284 1.245 dholland return ulfs_setattr(v);
1285 1.1 mycroft }
1286 1.22 perseant
1287 1.1 mycroft /*
1288 1.179 perseant * Release the block we hold on lfs_newseg wrapping. Called on file close,
1289 1.188 perseant * or explicitly from LFCNWRAPGO. Called with the interlock held.
1290 1.179 perseant */
1291 1.179 perseant static int
1292 1.193 christos lfs_wrapgo(struct lfs *fs, struct inode *ip, int waitfor)
1293 1.179 perseant {
1294 1.214 ad if (fs->lfs_stoplwp != curlwp)
1295 1.179 perseant return EBUSY;
1296 1.179 perseant
1297 1.214 ad fs->lfs_stoplwp = NULL;
1298 1.214 ad cv_signal(&fs->lfs_stopcv);
1299 1.179 perseant
1300 1.179 perseant KASSERT(fs->lfs_nowrap > 0);
1301 1.179 perseant if (fs->lfs_nowrap <= 0) {
1302 1.179 perseant return 0;
1303 1.179 perseant }
1304 1.179 perseant
1305 1.179 perseant if (--fs->lfs_nowrap == 0) {
1306 1.275 dholland log(LOG_NOTICE, "%s: re-enabled log wrap\n",
1307 1.275 dholland lfs_sb_getfsmnt(fs));
1308 1.188 perseant wakeup(&fs->lfs_wrappass);
1309 1.180 perseant lfs_wakeup_cleaner(fs);
1310 1.179 perseant }
1311 1.179 perseant if (waitfor) {
1312 1.318 maya cv_wait_sig(&fs->lfs_nextsegsleep, &lfs_lock);
1313 1.179 perseant }
1314 1.179 perseant
1315 1.179 perseant return 0;
1316 1.179 perseant }
1317 1.179 perseant
1318 1.179 perseant /*
1319 1.251 dholland * Close called.
1320 1.251 dholland *
1321 1.251 dholland * Update the times on the inode.
1322 1.1 mycroft */
1323 1.1 mycroft /* ARGSUSED */
1324 1.1 mycroft int
1325 1.51 perseant lfs_close(void *v)
1326 1.10 christos {
1327 1.1 mycroft struct vop_close_args /* {
1328 1.1 mycroft struct vnode *a_vp;
1329 1.1 mycroft int a_fflag;
1330 1.176 elad kauth_cred_t a_cred;
1331 1.10 christos } */ *ap = v;
1332 1.35 augustss struct vnode *vp = ap->a_vp;
1333 1.311 riastrad struct inode *ip;
1334 1.311 riastrad struct lfs *fs;
1335 1.311 riastrad
1336 1.311 riastrad KASSERT(VOP_ISLOCKED(vp) == LK_EXCLUSIVE);
1337 1.311 riastrad
1338 1.311 riastrad ip = VTOI(vp);
1339 1.311 riastrad fs = ip->i_lfs;
1340 1.1 mycroft
1341 1.245 dholland if ((ip->i_number == ULFS_ROOTINO || ip->i_number == LFS_IFILE_INUM) &&
1342 1.214 ad fs->lfs_stoplwp == curlwp) {
1343 1.214 ad mutex_enter(&lfs_lock);
1344 1.188 perseant log(LOG_NOTICE, "lfs_close: releasing log wrap control\n");
1345 1.180 perseant lfs_wrapgo(fs, ip, 0);
1346 1.214 ad mutex_exit(&lfs_lock);
1347 1.179 perseant }
1348 1.179 perseant
1349 1.97 perseant if (vp == ip->i_lfs->lfs_ivnode &&
1350 1.119 dbj vp->v_mount->mnt_iflag & IMNT_UNMOUNT)
1351 1.97 perseant return 0;
1352 1.97 perseant
1353 1.332 ad if (vrefcnt(vp) > 1 && vp != ip->i_lfs->lfs_ivnode) {
1354 1.154 christos LFS_ITIMES(ip, NULL, NULL, NULL);
1355 1.1 mycroft }
1356 1.1 mycroft return (0);
1357 1.65 perseant }
1358 1.65 perseant
1359 1.65 perseant /*
1360 1.65 perseant * Close wrapper for special devices.
1361 1.65 perseant *
1362 1.65 perseant * Update the times on the inode then do device close.
1363 1.65 perseant */
1364 1.65 perseant int
1365 1.65 perseant lfsspec_close(void *v)
1366 1.65 perseant {
1367 1.65 perseant struct vop_close_args /* {
1368 1.65 perseant struct vnode *a_vp;
1369 1.65 perseant int a_fflag;
1370 1.176 elad kauth_cred_t a_cred;
1371 1.65 perseant } */ *ap = v;
1372 1.65 perseant struct vnode *vp;
1373 1.65 perseant struct inode *ip;
1374 1.65 perseant
1375 1.65 perseant vp = ap->a_vp;
1376 1.311 riastrad
1377 1.311 riastrad KASSERT(VOP_ISLOCKED(vp) == LK_EXCLUSIVE);
1378 1.311 riastrad
1379 1.65 perseant ip = VTOI(vp);
1380 1.332 ad if (vrefcnt(vp) > 1) {
1381 1.154 christos LFS_ITIMES(ip, NULL, NULL, NULL);
1382 1.65 perseant }
1383 1.65 perseant return (VOCALL (spec_vnodeop_p, VOFFSET(vop_close), ap));
1384 1.65 perseant }
1385 1.65 perseant
1386 1.65 perseant /*
1387 1.65 perseant * Close wrapper for fifo's.
1388 1.65 perseant *
1389 1.65 perseant * Update the times on the inode then do device close.
1390 1.65 perseant */
1391 1.65 perseant int
1392 1.65 perseant lfsfifo_close(void *v)
1393 1.65 perseant {
1394 1.65 perseant struct vop_close_args /* {
1395 1.65 perseant struct vnode *a_vp;
1396 1.65 perseant int a_fflag;
1397 1.176 elad kauth_cred_ a_cred;
1398 1.65 perseant } */ *ap = v;
1399 1.65 perseant struct vnode *vp;
1400 1.65 perseant struct inode *ip;
1401 1.65 perseant
1402 1.65 perseant vp = ap->a_vp;
1403 1.311 riastrad
1404 1.311 riastrad KASSERT(VOP_ISLOCKED(vp) == LK_EXCLUSIVE);
1405 1.311 riastrad
1406 1.65 perseant ip = VTOI(vp);
1407 1.332 ad if (vrefcnt(ap->a_vp) > 1) {
1408 1.154 christos LFS_ITIMES(ip, NULL, NULL, NULL);
1409 1.65 perseant }
1410 1.65 perseant return (VOCALL (fifo_vnodeop_p, VOFFSET(vop_close), ap));
1411 1.1 mycroft }
1412 1.1 mycroft
1413 1.1 mycroft /*
1414 1.15 fvdl * Reclaim an inode so that it can be used for other purposes.
1415 1.1 mycroft */
1416 1.1 mycroft
1417 1.1 mycroft int
1418 1.51 perseant lfs_reclaim(void *v)
1419 1.10 christos {
1420 1.315 riastrad struct vop_reclaim_v2_args /* {
1421 1.1 mycroft struct vnode *a_vp;
1422 1.10 christos } */ *ap = v;
1423 1.15 fvdl struct vnode *vp = ap->a_vp;
1424 1.311 riastrad struct inode *ip;
1425 1.311 riastrad struct lfs *fs;
1426 1.1 mycroft int error;
1427 1.77 yamt
1428 1.315 riastrad VOP_UNLOCK(vp);
1429 1.315 riastrad
1430 1.311 riastrad ip = VTOI(vp);
1431 1.311 riastrad fs = ip->i_lfs;
1432 1.311 riastrad
1433 1.231 hannken /*
1434 1.231 hannken * The inode must be freed and updated before being removed
1435 1.231 hannken * from its hash chain. Other threads trying to gain a hold
1436 1.262 hannken * or lock on the inode will be stalled.
1437 1.231 hannken */
1438 1.231 hannken if (ip->i_nlink <= 0 && (vp->v_mount->mnt_flag & MNT_RDONLY) == 0)
1439 1.231 hannken lfs_vfree(vp, ip->i_number, ip->i_omode);
1440 1.231 hannken
1441 1.214 ad mutex_enter(&lfs_lock);
1442 1.84 perseant LFS_CLR_UINO(ip, IN_ALLMOD);
1443 1.214 ad mutex_exit(&lfs_lock);
1444 1.245 dholland if ((error = ulfs_reclaim(vp)))
1445 1.1 mycroft return (error);
1446 1.203 perseant
1447 1.203 perseant /*
1448 1.203 perseant * Take us off the paging and/or dirop queues if we were on them.
1449 1.203 perseant * We shouldn't be on them.
1450 1.203 perseant */
1451 1.214 ad mutex_enter(&lfs_lock);
1452 1.317 maya if (ip->i_state & IN_PAGING) {
1453 1.203 perseant log(LOG_WARNING, "%s: reclaimed vnode is IN_PAGING\n",
1454 1.275 dholland lfs_sb_getfsmnt(fs));
1455 1.317 maya ip->i_state &= ~IN_PAGING;
1456 1.203 perseant TAILQ_REMOVE(&fs->lfs_pchainhd, ip, i_lfs_pchain);
1457 1.203 perseant }
1458 1.320 maya if (vp->v_uflag & VU_DIROP)
1459 1.212 ad panic("reclaimed vnode is VU_DIROP");
1460 1.214 ad mutex_exit(&lfs_lock);
1461 1.203 perseant
1462 1.287 dholland pool_put(&lfs_dinode_pool, ip->i_din);
1463 1.145 perseant lfs_deregister_all(vp);
1464 1.84 perseant pool_put(&lfs_inoext_pool, ip->inode_ext.lfs);
1465 1.84 perseant ip->inode_ext.lfs = NULL;
1466 1.199 ad genfs_node_destroy(vp);
1467 1.19 thorpej pool_put(&lfs_inode_pool, vp->v_data);
1468 1.1 mycroft vp->v_data = NULL;
1469 1.94 perseant return (0);
1470 1.94 perseant }
1471 1.94 perseant
1472 1.94 perseant /*
1473 1.101 yamt * Read a block from a storage device.
1474 1.251 dholland *
1475 1.251 dholland * Calculate the logical to physical mapping if not done already,
1476 1.251 dholland * then call the device strategy routine.
1477 1.251 dholland *
1478 1.94 perseant * In order to avoid reading blocks that are in the process of being
1479 1.94 perseant * written by the cleaner---and hence are not mutexed by the normal
1480 1.94 perseant * buffer cache / page cache mechanisms---check for collisions before
1481 1.94 perseant * reading.
1482 1.94 perseant *
1483 1.245 dholland * We inline ulfs_strategy to make sure that the VOP_BMAP occurs *before*
1484 1.94 perseant * the active cleaner test.
1485 1.94 perseant *
1486 1.94 perseant * XXX This code assumes that lfs_markv makes synchronous checkpoints.
1487 1.94 perseant */
/*
 * v points at a struct vop_strategy_args carrying the vnode (a_vp) and
 * the buffer to read (a_bp).
 *
 * Returns the VOP_BMAP error if the mapping fails (the buffer is
 * completed with b_error set), 0 if the block turns out not to be on
 * disk (the buffer is completed with b_resid == b_bcount), and
 * otherwise whatever VOP_STRATEGY on the inode's device vnode returns.
 */
1488 1.94 perseant int
1489 1.94 perseant lfs_strategy(void *v)
1490 1.94 perseant {
1491 1.94 perseant struct vop_strategy_args /* {
1492 1.128 hannken struct vnode *a_vp;
1493 1.94 perseant struct buf *a_bp;
1494 1.94 perseant } */ *ap = v;
1495 1.94 perseant struct buf *bp;
1496 1.94 perseant struct lfs *fs;
1497 1.94 perseant struct vnode *vp;
1498 1.94 perseant struct inode *ip;
1499 1.94 perseant daddr_t tbn;
/* Upper bound on the number of timed "clean2" sleeps before giving up. */
1500 1.239 perseant #define MAXLOOP 25
1501 1.239 perseant int i, sn, error, slept, loopcount;
1502 1.94 perseant
1503 1.94 perseant bp = ap->a_bp;
1504 1.128 hannken vp = ap->a_vp;
1505 1.94 perseant ip = VTOI(vp);
1506 1.94 perseant fs = ip->i_lfs;
1507 1.94 perseant
1508 1.101 yamt /* lfs uses its strategy routine only for read */
1509 1.101 yamt KASSERT(bp->b_flags & B_READ);
1510 1.101 yamt
1511 1.94 perseant if (vp->v_type == VBLK || vp->v_type == VCHR)
1512 1.94 perseant panic("lfs_strategy: spec");
1513 1.94 perseant KASSERT(bp->b_bcount != 0);
/*
 * b_blkno still equal to b_lblkno is taken to mean that the logical
 * block has not been mapped yet, so ask VOP_BMAP for the disk address.
 */
1514 1.94 perseant if (bp->b_blkno == bp->b_lblkno) {
1515 1.94 perseant error = VOP_BMAP(vp, bp->b_lblkno, NULL, &bp->b_blkno,
1516 1.94 perseant NULL);
1517 1.94 perseant if (error) {
1518 1.94 perseant bp->b_error = error;
1519 1.214 ad bp->b_resid = bp->b_bcount;
1520 1.94 perseant biodone(bp);
1521 1.94 perseant return (error);
1522 1.94 perseant }
1523 1.94 perseant if ((long)bp->b_blkno == -1) /* no valid data */
1524 1.94 perseant clrbuf(bp);
1525 1.94 perseant }
1526 1.94 perseant if ((long)bp->b_blkno < 0) { /* block is not on disk */
1527 1.214 ad bp->b_resid = bp->b_bcount;
1528 1.94 perseant biodone(bp);
1529 1.94 perseant return (0);
1530 1.94 perseant }
1531 1.94 perseant
/*
 * slept starts out as 1 so that the interval scan below runs at least
 * once whenever the segment lock is held; the scan is then repeated
 * for as long as the previous pass had to sleep.
 */
1532 1.94 perseant slept = 1;
1533 1.239 perseant loopcount = 0;
1534 1.214 ad mutex_enter(&lfs_lock);
1535 1.101 yamt while (slept && fs->lfs_seglock) {
/* lfs_lock is only needed for the loop test; drop it for the scan. */
1536 1.214 ad mutex_exit(&lfs_lock);
1537 1.94 perseant /*
1538 1.94 perseant * Look through list of intervals.
1539 1.94 perseant * There will only be intervals to look through
1540 1.94 perseant * if the cleaner holds the seglock.
1541 1.94 perseant * Since the cleaner is synchronous, we can trust
1542 1.94 perseant * the list of intervals to be current.
1543 1.94 perseant */
1544 1.248 christos tbn = LFS_DBTOFSB(fs, bp->b_blkno);
1545 1.248 christos sn = lfs_dtosn(fs, tbn);
1546 1.94 perseant slept = 0;
1547 1.94 perseant for (i = 0; i < fs->lfs_cleanind; i++) {
/*
 * Collision: our block lies in the same segment as cleaning interval i
 * and at or beyond the interval's starting address.
 */
1548 1.248 christos if (sn == lfs_dtosn(fs, fs->lfs_cleanint[i]) &&
1549 1.94 perseant tbn >= fs->lfs_cleanint[i]) {
1550 1.136 perseant DLOG((DLOG_CLEAN,
1551 1.306 maya "lfs_strategy: ino %llu lbn %" PRId64
1552 1.280 dholland " ind %d sn %d fsb %" PRIx64
1553 1.203 perseant " given sn %d fsb %" PRIx64 "\n",
1554 1.306 maya (unsigned long long) ip->i_number,
1555 1.306 maya bp->b_lblkno, i,
1556 1.248 christos lfs_dtosn(fs, fs->lfs_cleanint[i]),
1557 1.203 perseant fs->lfs_cleanint[i], sn, tbn));
1558 1.136 perseant DLOG((DLOG_CLEAN,
1559 1.306 maya "lfs_strategy: sleeping on ino %llu lbn %"
1560 1.306 maya PRId64 "\n",
1561 1.306 maya (unsigned long long) ip->i_number,
1562 1.306 maya bp->b_lblkno));
1563 1.214 ad mutex_enter(&lfs_lock);
1564 1.170 perseant if (LFS_SEGLOCK_HELD(fs) && fs->lfs_iocount) {
1565 1.239 perseant /*
1566 1.239 perseant * Cleaner can't wait for itself.
1567 1.239 perseant * Instead, wait for the blocks
1568 1.239 perseant * to be written to disk.
1569 1.239 perseant * XXX we need pribio in the test
1570 1.239 perseant * XXX here.
1571 1.239 perseant */
1572 1.239 perseant mtsleep(&fs->lfs_iocount,
1573 1.239 perseant (PRIBIO + 1) | PNORELOCK,
1574 1.239 perseant "clean2", hz/10 + 1,
1575 1.239 perseant &lfs_lock);
/*
 * With PNORELOCK the sleep comes back without lfs_lock held; the lock
 * is taken again right after the for loop.  Only these timed sleeps
 * count towards MAXLOOP.
 */
1576 1.170 perseant slept = 1;
1577 1.239 perseant ++loopcount;
1578 1.170 perseant break;
1579 1.170 perseant } else if (fs->lfs_seglock) {
/* Someone else holds the seglock: sleep (no timeout) until it changes. */
1580 1.214 ad mtsleep(&fs->lfs_seglock,
1581 1.141 perseant (PRIBIO + 1) | PNORELOCK,
1582 1.170 perseant "clean1", 0,
1583 1.214 ad &lfs_lock);
1584 1.167 perseant slept = 1;
1585 1.167 perseant break;
1586 1.167 perseant }
/* Seglock was released in the meantime; nothing to wait for here. */
1587 1.214 ad mutex_exit(&lfs_lock);
1588 1.94 perseant }
1589 1.94 perseant }
/* Every path out of the for loop arrives here without lfs_lock. */
1590 1.214 ad mutex_enter(&lfs_lock);
1591 1.239 perseant if (loopcount > MAXLOOP) {
1592 1.239 perseant printf("lfs_strategy: breaking out of clean2 loop\n");
1593 1.239 perseant break;
1594 1.239 perseant }
1595 1.94 perseant }
1596 1.214 ad mutex_exit(&lfs_lock);
1597 1.94 perseant
/* Issue the read against the device vnode backing this inode. */
1598 1.94 perseant vp = ip->i_devvp;
1599 1.251 dholland return VOP_STRATEGY(vp, bp);
1600 1.89 perseant }
1601 1.89 perseant
1602 1.239 perseant /*
1603 1.239 perseant * Inline lfs_segwrite/lfs_writevnodes, but just for dirops.
1604 1.239 perseant * Technically this is a checkpoint (the on-disk state is valid)
1605 1.239 perseant * even though we are leaving out all the file data.
1606 1.239 perseant */
/*
 * Write out every inode currently on fs->lfs_dchainhd (the dirop
 * chain) in one segment write.
 *
 * Returns EROFS if fs->lfs_ronly is set, 0 if the chain is empty,
 * EAGAIN if lfs_writefile or lfs_writeinode fails while the segment
 * carries SEGM_SINGLE, and otherwise the result of the last
 * lfs_writeinode call (0 if none was made).
 */
1607 1.239 perseant int
1608 1.92 perseant lfs_flush_dirops(struct lfs *fs)
1609 1.92 perseant {
1610 1.326 riastrad struct inode *ip, *marker;
1611 1.92 perseant struct vnode *vp;
1612 1.285 dholland extern int lfs_dostats; /* XXX this does not belong here */
1613 1.92 perseant struct segment *sp;
1614 1.285 dholland SEGSUM *ssp;
1615 1.239 perseant int flags = 0;
1616 1.239 perseant int error = 0;
1617 1.92 perseant
1618 1.163 perseant ASSERT_MAYBE_SEGLOCK(fs);
1619 1.327 riastrad KASSERT(fs->lfs_nadirop == 0); /* stable during lfs_writer */
1620 1.327 riastrad KASSERT(fs->lfs_dirops == 0); /* stable during lfs_writer */
1621 1.141 perseant
1622 1.92 perseant if (fs->lfs_ronly)
1623 1.239 perseant return EROFS;
1624 1.92 perseant
/* Nothing queued: return before allocating the marker or taking the seglock. */
1625 1.214 ad mutex_enter(&lfs_lock);
1626 1.141 perseant if (TAILQ_FIRST(&fs->lfs_dchainhd) == NULL) {
1627 1.214 ad mutex_exit(&lfs_lock);
1628 1.239 perseant return 0;
1629 1.141 perseant } else
1630 1.214 ad mutex_exit(&lfs_lock);
1631 1.92 perseant
1632 1.92 perseant if (lfs_dostats)
1633 1.92 perseant ++lfs_stats.flush_invoked;
1634 1.92 perseant
/*
 * The marker is a zeroed dummy inode flagged IN_MARKER.  It is linked
 * into the dirop chain to remember the scan position, because lfs_lock
 * is dropped while each real entry is being written.
 */
1635 1.326 riastrad marker = pool_get(&lfs_inode_pool, PR_WAITOK);
1636 1.326 riastrad memset(marker, 0, sizeof(*marker));
1637 1.326 riastrad marker->inode_ext.lfs = pool_get(&lfs_inoext_pool, PR_WAITOK);
1638 1.326 riastrad memset(marker->inode_ext.lfs, 0, sizeof(*marker->inode_ext.lfs));
1639 1.326 riastrad marker->i_state = IN_MARKER;
1640 1.326 riastrad
1641 1.92 perseant lfs_imtime(fs);
1642 1.239 perseant lfs_seglock(fs, flags);
1643 1.92 perseant sp = fs->lfs_sp;
1644 1.92 perseant
1645 1.92 perseant /*
1646 1.92 perseant * lfs_writevnodes, optimized to get dirops out of the way.
1647 1.92 perseant * Only write dirops, and don't flush files' pages, only
1648 1.92 perseant * blocks from the directories.
1649 1.92 perseant *
1650 1.92 perseant * We don't need to vref these files because they are
1651 1.92 perseant * dirops and so hold an extra reference until the
1652 1.92 perseant * segunlock clears them of that status.
1653 1.92 perseant *
1654 1.92 perseant * We don't need to check for IN_ADIROP because we know that
1655 1.92 perseant * no dirops are active.
1656 1.92 perseant *
1657 1.92 perseant */
1658 1.214 ad mutex_enter(&lfs_lock);
1659 1.327 riastrad KASSERT(fs->lfs_writer);
1660 1.326 riastrad TAILQ_INSERT_HEAD(&fs->lfs_dchainhd, marker, i_lfs_dchain);
/*
 * Each pass takes the entry right after the marker and moves the
 * marker behind it, so the walk resumes from the right place after the
 * lock has been dropped.  Entries that are themselves markers are
 * stepped over.
 */
1661 1.326 riastrad while ((ip = TAILQ_NEXT(marker, i_lfs_dchain)) != NULL) {
1662 1.326 riastrad TAILQ_REMOVE(&fs->lfs_dchainhd, marker, i_lfs_dchain);
1663 1.326 riastrad TAILQ_INSERT_AFTER(&fs->lfs_dchainhd, ip, marker,
1664 1.326 riastrad i_lfs_dchain);
1665 1.330 riastrad if (ip->i_state & IN_MARKER)
1666 1.326 riastrad continue;
1667 1.92 perseant vp = ITOV(ip);
1668 1.92 perseant
1669 1.329 riastrad /*
1670 1.329 riastrad * Prevent the vnode from going away if it's just been
1671 1.329 riastrad * put out in the segment and lfs_unmark_dirop is about
1672 1.329 riastrad * to release it. While it is on the list it is always
1673 1.329 riastrad * referenced, so it cannot be reclaimed until we
1674 1.329 riastrad * release it.
1675 1.329 riastrad */
1676 1.329 riastrad vref(vp);
1677 1.329 riastrad
1678 1.329 riastrad /*
1679 1.329 riastrad * Since we hold lfs_writer, the node can't be in an
1680 1.329 riastrad * active dirop. Since it's on the list and we hold a
1681 1.329 riastrad * reference to it, it can't be reclaimed now.
1682 1.329 riastrad */
1683 1.317 maya KASSERT((ip->i_state & IN_ADIROP) == 0);
1684 1.239 perseant KASSERT(vp->v_uflag & VU_DIROP);
1685 1.329 riastrad
1686 1.329 riastrad /*
1687 1.329 riastrad * After we release lfs_lock, if we were in the middle
1688 1.329 riastrad * of writing a segment, lfs_unmark_dirop may end up
1689 1.329 riastrad * clearing VU_DIROP, and we have no way to stop it.
1690 1.329 riastrad * That should be OK -- we'll just have less to do
1691 1.329 riastrad * here.
1692 1.329 riastrad */
1693 1.329 riastrad mutex_exit(&lfs_lock);
1694 1.171 perseant
1695 1.92 perseant /*
1696 1.92 perseant * All writes to directories come from dirops; all
1697 1.92 perseant * writes to files' direct blocks go through the page
1698 1.92 perseant * cache, which we're not touching. Reads to files
1699 1.92 perseant * and/or directories will not be affected by writing
1700 1.92 perseant * directory blocks inodes and file inodes. So we don't
1701 1.239 perseant * really need to lock.
1702 1.92 perseant */
1703 1.92 perseant if (vp->v_type != VREG &&
1704 1.317 maya ((ip->i_state & IN_ALLMOD) || !VPISEMPTY(vp))) {
1705 1.239 perseant error = lfs_writefile(fs, sp, vp);
1706 1.92 perseant if (!VPISEMPTY(vp) && !WRITEINPROG(vp) &&
1707 1.317 maya !(ip->i_state & IN_ALLMOD)) {
1708 1.214 ad mutex_enter(&lfs_lock);
1709 1.92 perseant LFS_SET_UINO(ip, IN_MODIFIED);
1710 1.214 ad mutex_exit(&lfs_lock);
1711 1.92 perseant }
/*
 * Bail out with EAGAIN.  The reference taken above is dropped and
 * lfs_lock is re-taken first, because the code after the loop expects
 * the lock to be held.
 */
1712 1.239 perseant if (error && (sp->seg_flags & SEGM_SINGLE)) {
1713 1.329 riastrad vrele(vp);
1714 1.239 perseant mutex_enter(&lfs_lock);
1715 1.239 perseant error = EAGAIN;
1716 1.239 perseant break;
1717 1.239 perseant }
1718 1.92 perseant }
1719 1.328 riastrad KASSERT(ip->i_number != LFS_IFILE_INUM);
1720 1.239 perseant error = lfs_writeinode(fs, sp, ip);
/* Same bail-out protocol as for the lfs_writefile failure above. */
1721 1.239 perseant if (error && (sp->seg_flags & SEGM_SINGLE)) {
1722 1.329 riastrad vrele(vp);
1723 1.329 riastrad mutex_enter(&lfs_lock);
1724 1.239 perseant error = EAGAIN;
1725 1.239 perseant break;
1726 1.239 perseant }
1727 1.239 perseant
1728 1.228 hannken /*
1729 1.239 perseant * We might need to update these inodes again,
1730 1.239 perseant * for example, if they have data blocks to write.
1731 1.239 perseant * Make sure that after this flush, they are still
1732 1.239 perseant * marked IN_MODIFIED so that we don't forget to
1733 1.239 perseant * write them.
1734 1.228 hannken */
1735 1.239 perseant /* XXX only for non-directories? --KS */
1736 1.329 riastrad mutex_enter(&lfs_lock);
1737 1.239 perseant LFS_SET_UINO(ip, IN_MODIFIED);
1738 1.329 riastrad mutex_exit(&lfs_lock);
1739 1.329 riastrad
/* vrele is called with lfs_lock dropped; the lock is re-taken for the next pass. */
1740 1.329 riastrad vrele(vp);
1741 1.329 riastrad mutex_enter(&lfs_lock);
1742 1.92 perseant }
/* lfs_lock is held on every path that reaches this point. */
1743 1.326 riastrad TAILQ_REMOVE(&fs->lfs_dchainhd, marker, i_lfs_dchain);
1744 1.214 ad mutex_exit(&lfs_lock);
1745 1.326 riastrad
1746 1.92 perseant /* We've written all the dirops there are */
1747 1.285 dholland ssp = (SEGSUM *)sp->segsum;
1748 1.285 dholland lfs_ss_setflags(fs, ssp, lfs_ss_getflags(fs, ssp) & ~(SS_CONT));
1749 1.170 perseant lfs_finalize_fs_seguse(fs);
/* The result of lfs_writeseg is deliberately discarded here. */
1750 1.92 perseant (void) lfs_writeseg(fs, sp);
1751 1.92 perseant lfs_segunlock(fs);
1752 1.239 perseant
/* Return the marker and its extension to their pools. */
1753 1.326 riastrad pool_put(&lfs_inoext_pool, marker->inode_ext.lfs);
1754 1.326 riastrad pool_put(&lfs_inode_pool, marker);
1755 1.326 riastrad
1756 1.239 perseant return error;
1757 1.92 perseant }
1758 1.92 perseant
1759 1.89 perseant /*
1760 1.164 perseant * Flush all vnodes for which the pagedaemon has requested pageouts.
1761 1.212 ad * Skip over any files that are marked VU_DIROP (since lfs_flush_dirops()
1762 1.164 perseant * has just run, this would be an error). If we have to skip a vnode
1763 1.164 perseant * for any reason, just skip it; if we have to wait for the cleaner,
1764 1.164 perseant * abort. The writer daemon will call us again later.
1765 1.164 perseant */
/*
 * Write out the regular files queued on fs->lfs_pchainhd (the pageout
 * chain).
 *
 * Returns EROFS if fs->lfs_ronly is set, 0 if the chain is empty, and
 * the error from lfs_flush_dirops if that call fails.  Once the scan
 * itself has started the function always returns 0: an EAGAIN from
 * lfs_writefile/lfs_writeinode only ends the scan early, and no error
 * from those calls is passed back to the caller.
 */
1766 1.239 perseant int
1767 1.164 perseant lfs_flush_pchain(struct lfs *fs)
1768 1.164 perseant {
1769 1.164 perseant struct inode *ip, *nip;
1770 1.164 perseant struct vnode *vp;
1771 1.164 perseant extern int lfs_dostats;
1772 1.164 perseant struct segment *sp;
1773 1.239 perseant int error, error2;
1774 1.164 perseant
1775 1.164 perseant ASSERT_NO_SEGLOCK(fs);
1776 1.327 riastrad KASSERT(fs->lfs_writer);
1777 1.164 perseant
1778 1.164 perseant if (fs->lfs_ronly)
1779 1.239 perseant return EROFS;
1780 1.164 perseant
1781 1.214 ad mutex_enter(&lfs_lock);
1782 1.164 perseant if (TAILQ_FIRST(&fs->lfs_pchainhd) == NULL) {
1783 1.214 ad mutex_exit(&lfs_lock);
1784 1.239 perseant return 0;
1785 1.164 perseant } else
1786 1.214 ad mutex_exit(&lfs_lock);
1787 1.164 perseant
1788 1.164 perseant /* Get dirops out of the way */
1789 1.239 perseant if ((error = lfs_flush_dirops(fs)) != 0)
1790 1.239 perseant return error;
1791 1.164 perseant
1792 1.164 perseant if (lfs_dostats)
1793 1.164 perseant ++lfs_stats.flush_invoked;
1794 1.164 perseant
1795 1.164 perseant /*
1796 1.164 perseant * Inline lfs_segwrite/lfs_writevnodes, but just for pageouts.
1797 1.164 perseant */
1798 1.164 perseant lfs_imtime(fs);
1799 1.164 perseant lfs_seglock(fs, 0);
1800 1.164 perseant sp = fs->lfs_sp;
1801 1.164 perseant
1802 1.164 perseant /*
1803 1.164 perseant * lfs_writevnodes, optimized to clear pageout requests.
1804 1.164 perseant * Only write non-dirop files that are in the pageout queue.
1805 1.164 perseant * We're very conservative about what we write; we want to be
1806 1.164 perseant * fast and async.
1807 1.164 perseant */
/*
 * Lock protocol for the scan: lfs_lock is held at "top" and at every
 * continue, goto top and break below; it is dropped only around the
 * vnode and segment operations in between.
 */
1808 1.214 ad mutex_enter(&lfs_lock);
1809 1.214 ad top:
1810 1.164 perseant for (ip = TAILQ_FIRST(&fs->lfs_pchainhd); ip != NULL; ip = nip) {
/* Remember mount and inode number so the vnode can be looked up unlocked. */
1811 1.277 hannken struct mount *mp = ITOV(ip)->v_mount;
1812 1.277 hannken ino_t ino = ip->i_number;
1813 1.277 hannken
1814 1.164 perseant nip = TAILQ_NEXT(ip, i_lfs_pchain);
1815 1.164 perseant
/* An entry without IN_PAGING restarts the scan from the head of the chain. */
1816 1.317 maya if (!(ip->i_state & IN_PAGING))
1817 1.164 perseant goto top;
1818 1.164 perseant
1819 1.277 hannken mutex_exit(&lfs_lock);
/* Failure to get or to lock the vnode just skips this entry. */
1820 1.277 hannken if (vcache_get(mp, &ino, sizeof(ino), &vp) != 0) {
1821 1.277 hannken mutex_enter(&lfs_lock);
1822 1.164 perseant continue;
1823 1.277 hannken };
1824 1.277 hannken if (vn_lock(vp, LK_EXCLUSIVE | LK_NOWAIT) != 0) {
1825 1.277 hannken vrele(vp);
1826 1.277 hannken mutex_enter(&lfs_lock);
1827 1.164 perseant continue;
1828 1.214 ad }
/* Re-derive the inode from the vnode that was actually obtained. */
1829 1.277 hannken ip = VTOI(vp);
1830 1.277 hannken mutex_enter(&lfs_lock);
/*
 * Re-check under lfs_lock: dirop vnodes, non-regular files and entries
 * that are no longer IN_PAGING are released and the scan restarts.
 */
1831 1.277 hannken if ((vp->v_uflag & VU_DIROP) != 0 || vp->v_type != VREG ||
1832 1.317 maya !(ip->i_state & IN_PAGING)) {
1833 1.277 hannken mutex_exit(&lfs_lock);
1834 1.277 hannken vput(vp);
1835 1.214 ad mutex_enter(&lfs_lock);
1836 1.277 hannken goto top;
1837 1.165 perseant }
1838 1.277 hannken mutex_exit(&lfs_lock);
1839 1.164 perseant
1840 1.164 perseant error = lfs_writefile(fs, sp, vp);
1841 1.164 perseant if (!VPISEMPTY(vp) && !WRITEINPROG(vp) &&
1842 1.317 maya !(ip->i_state & IN_ALLMOD)) {
1843 1.214 ad mutex_enter(&lfs_lock);
1844 1.164 perseant LFS_SET_UINO(ip, IN_MODIFIED);
1845 1.214 ad mutex_exit(&lfs_lock);
1846 1.164 perseant }
1847 1.328 riastrad KASSERT(ip->i_number != LFS_IFILE_INUM);
1848 1.239 perseant error2 = lfs_writeinode(fs, sp, ip);
1849 1.164 perseant
1850 1.229 hannken VOP_UNLOCK(vp);
1851 1.272 hannken vrele(vp);
1852 1.164 perseant
/* EAGAIN from either write: push the segment out now and stop scanning. */
1853 1.239 perseant if (error == EAGAIN || error2 == EAGAIN) {
1854 1.164 perseant lfs_writeseg(fs, sp);
1855 1.214 ad mutex_enter(&lfs_lock);
1856 1.164 perseant break;
1857 1.164 perseant }
1858 1.214 ad mutex_enter(&lfs_lock);
1859 1.164 perseant }
1860 1.214 ad mutex_exit(&lfs_lock);
1861 1.164 perseant (void) lfs_writeseg(fs, sp);
1862 1.164 perseant lfs_segunlock(fs);
1863 1.239 perseant
/* error/error2 from the scan are intentionally not returned. */
1864 1.239 perseant return 0;
1865 1.164 perseant }
1866 1.164 perseant
1867 1.164 perseant /*
1868 1.283 dholland * Conversion for compat.
1869 1.283 dholland */
1870 1.283 dholland static void
1871 1.283 dholland block_info_from_70(BLOCK_INFO *bi, const BLOCK_INFO_70 *bi70)
1872 1.283 dholland {
1873 1.283 dholland bi->bi_inode = bi70->bi_inode;
1874 1.283 dholland bi->bi_lbn = bi70->bi_lbn;
1875 1.283 dholland bi->bi_daddr = bi70->bi_daddr;
1876 1.283 dholland bi->bi_segcreate = bi70->bi_segcreate;
1877 1.283 dholland bi->bi_version = bi70->bi_version;
1878 1.283 dholland bi->bi_bp = bi70->bi_bp;
1879 1.283 dholland bi->bi_size = bi70->bi_size;
1880 1.283 dholland }
1881 1.283 dholland
1882 1.283 dholland static void
1883 1.283 dholland block_info_to_70(BLOCK_INFO_70 *bi70, const BLOCK_INFO *bi)
1884 1.283 dholland {
1885 1.283 dholland bi70->bi_inode = bi->bi_inode;
1886 1.283 dholland bi70->bi_lbn = bi->bi_lbn;
1887 1.283 dholland bi70->bi_daddr = bi->bi_daddr;
1888 1.283 dholland bi70->bi_segcreate = bi->bi_segcreate;
1889 1.283 dholland bi70->bi_version = bi->bi_version;
1890 1.283 dholland bi70->bi_bp = bi->bi_bp;
1891 1.283 dholland bi70->bi_size = bi->bi_size;
1892 1.283 dholland }
1893 1.283 dholland
1894 1.283 dholland /*
1895 1.90 perseant * Provide a fcntl interface to sys_lfs_{segwait,bmapv,markv}.
1896 1.89 perseant */
1897 1.89 perseant int
1898 1.90 perseant lfs_fcntl(void *v)
1899 1.89 perseant {
1900 1.137 simonb struct vop_fcntl_args /* {
1901 1.137 simonb struct vnode *a_vp;
1902 1.218 gmcgarry u_int a_command;
1903 1.201 christos void * a_data;
1904 1.137 simonb int a_fflag;
1905 1.176 elad kauth_cred_t a_cred;
1906 1.137 simonb } */ *ap = v;
1907 1.222 christos struct timeval tv;
1908 1.89 perseant struct timeval *tvp;
1909 1.89 perseant BLOCK_INFO *blkiov;
1910 1.283 dholland BLOCK_INFO_70 *blkiov70;
1911 1.92 perseant CLEANERINFO *cip;
1912 1.148 perseant SEGUSE *sup;
1913 1.283 dholland int blkcnt, i, error;
1914 1.181 martin size_t fh_size;
1915 1.90 perseant struct lfs_fcntl_markv blkvp;
1916 1.283 dholland struct lfs_fcntl_markv_70 blkvp70;
1917 1.185 ad struct lwp *l;
1918 1.89 perseant fsid_t *fsidp;
1919 1.92 perseant struct lfs *fs;
1920 1.92 perseant struct buf *bp;
1921 1.134 perseant fhandle_t *fhp;
1922 1.92 perseant daddr_t off;
1923 1.258 christos int oclean;
1924 1.89 perseant
1925 1.90 perseant /* Only respect LFS fcntls on fs root or Ifile */
1926 1.245 dholland if (VTOI(ap->a_vp)->i_number != ULFS_ROOTINO &&
1927 1.89 perseant VTOI(ap->a_vp)->i_number != LFS_IFILE_INUM) {
1928 1.245 dholland return ulfs_fcntl(v);
1929 1.89 perseant }
1930 1.89 perseant
1931 1.100 perseant /* Avoid locking a draining lock */
1932 1.119 dbj if (ap->a_vp->v_mount->mnt_iflag & IMNT_UNMOUNT) {
1933 1.100 perseant return ESHUTDOWN;
1934 1.100 perseant }
1935 1.100 perseant
1936 1.184 perseant /* LFS control and monitoring fcntls are available only to root */
1937 1.213 pooka l = curlwp;
1938 1.184 perseant if (((ap->a_command & 0xff00) >> 8) == 'L' &&
1939 1.241 elad (error = kauth_authorize_system(l->l_cred, KAUTH_SYSTEM_LFS,
1940 1.241 elad KAUTH_REQ_SYSTEM_LFS_FCNTL, NULL, NULL, NULL)) != 0)
1941 1.184 perseant return (error);
1942 1.184 perseant
1943 1.100 perseant fs = VTOI(ap->a_vp)->i_lfs;
1944 1.131 christos fsidp = &ap->a_vp->v_mount->mnt_stat.f_fsidx;
1945 1.89 perseant
1946 1.188 perseant error = 0;
1947 1.218 gmcgarry switch ((int)ap->a_command) {
1948 1.222 christos case LFCNSEGWAITALL_COMPAT_50:
1949 1.222 christos case LFCNSEGWAITALL_COMPAT:
1950 1.222 christos fsidp = NULL;
1951 1.283 dholland /* FALLTHROUGH */
1952 1.222 christos case LFCNSEGWAIT_COMPAT_50:
1953 1.222 christos case LFCNSEGWAIT_COMPAT:
1954 1.222 christos {
1955 1.222 christos struct timeval50 *tvp50
1956 1.222 christos = (struct timeval50 *)ap->a_data;
1957 1.222 christos timeval50_to_timeval(tvp50, &tv);
1958 1.222 christos tvp = &tv;
1959 1.222 christos }
1960 1.222 christos goto segwait_common;
1961 1.90 perseant case LFCNSEGWAITALL:
1962 1.214 ad fsidp = NULL;
1963 1.283 dholland /* FALLTHROUGH */
1964 1.90 perseant case LFCNSEGWAIT:
1965 1.214 ad tvp = (struct timeval *)ap->a_data;
1966 1.222 christos segwait_common:
1967 1.214 ad mutex_enter(&lfs_lock);
1968 1.214 ad ++fs->lfs_sleepers;
1969 1.214 ad mutex_exit(&lfs_lock);
1970 1.214 ad
1971 1.214 ad error = lfs_segwait(fsidp, tvp);
1972 1.214 ad
1973 1.214 ad mutex_enter(&lfs_lock);
1974 1.214 ad if (--fs->lfs_sleepers == 0)
1975 1.308 maya cv_broadcast(&fs->lfs_sleeperscv);
1976 1.214 ad mutex_exit(&lfs_lock);
1977 1.214 ad return error;
1978 1.89 perseant
1979 1.283 dholland case LFCNBMAPV_COMPAT_70:
1980 1.283 dholland case LFCNMARKV_COMPAT_70:
1981 1.283 dholland blkvp70 = *(struct lfs_fcntl_markv_70 *)ap->a_data;
1982 1.283 dholland
1983 1.283 dholland blkcnt = blkvp70.blkcnt;
1984 1.283 dholland if ((u_int) blkcnt > LFS_MARKV_MAXBLKCNT)
1985 1.283 dholland return (EINVAL);
1986 1.283 dholland blkiov = lfs_malloc(fs, blkcnt * sizeof(BLOCK_INFO), LFS_NB_BLKIOV);
1987 1.283 dholland blkiov70 = lfs_malloc(fs, sizeof(BLOCK_INFO_70), LFS_NB_BLKIOV);
1988 1.283 dholland for (i = 0; i < blkcnt; i++) {
1989 1.283 dholland error = copyin(&blkvp70.blkiov[i], blkiov70,
1990 1.283 dholland sizeof(*blkiov70));
1991 1.283 dholland if (error) {
1992 1.283 dholland lfs_free(fs, blkiov70, LFS_NB_BLKIOV);
1993 1.283 dholland lfs_free(fs, blkiov, LFS_NB_BLKIOV);
1994 1.283 dholland return error;
1995 1.283 dholland }
1996 1.283 dholland block_info_from_70(&blkiov[i], blkiov70);
1997 1.283 dholland }
1998 1.283 dholland
1999 1.283 dholland mutex_enter(&lfs_lock);
2000 1.283 dholland ++fs->lfs_sleepers;
2001 1.283 dholland mutex_exit(&lfs_lock);
2002 1.283 dholland if (ap->a_command == LFCNBMAPV)
2003 1.283 dholland error = lfs_bmapv(l, fsidp, blkiov, blkcnt);
2004 1.283 dholland else /* LFCNMARKV */
2005 1.283 dholland error = lfs_markv(l, fsidp, blkiov, blkcnt);
2006 1.283 dholland if (error == 0) {
2007 1.283 dholland for (i = 0; i < blkcnt; i++) {
2008 1.283 dholland block_info_to_70(blkiov70, &blkiov[i]);
2009 1.283 dholland error = copyout(blkiov70, &blkvp70.blkiov[i],
2010 1.283 dholland sizeof(*blkiov70));
2011 1.283 dholland if (error) {
2012 1.283 dholland break;
2013 1.283 dholland }
2014 1.283 dholland }
2015 1.283 dholland }
2016 1.283 dholland mutex_enter(&lfs_lock);
2017 1.283 dholland if (--fs->lfs_sleepers == 0)
2018 1.308 maya cv_broadcast(&fs->lfs_sleeperscv);
2019 1.283 dholland mutex_exit(&lfs_lock);
2020 1.283 dholland lfs_free(fs, blkiov, LFS_NB_BLKIOV);
2021 1.283 dholland return error;
2022 1.283 dholland
2023 1.90 perseant case LFCNBMAPV:
2024 1.90 perseant case LFCNMARKV:
2025 1.214 ad blkvp = *(struct lfs_fcntl_markv *)ap->a_data;
2026 1.89 perseant
2027 1.214 ad blkcnt = blkvp.blkcnt;
2028 1.214 ad if ((u_int) blkcnt > LFS_MARKV_MAXBLKCNT)
2029 1.214 ad return (EINVAL);
2030 1.214 ad blkiov = lfs_malloc(fs, blkcnt * sizeof(BLOCK_INFO), LFS_NB_BLKIOV);
2031 1.214 ad if ((error = copyin(blkvp.blkiov, blkiov,
2032 1.214 ad blkcnt * sizeof(BLOCK_INFO))) != 0) {
2033 1.214 ad lfs_free(fs, blkiov, LFS_NB_BLKIOV);
2034 1.214 ad return error;
2035 1.214 ad }
2036 1.214 ad
2037 1.214 ad mutex_enter(&lfs_lock);
2038 1.214 ad ++fs->lfs_sleepers;
2039 1.214 ad mutex_exit(&lfs_lock);
2040 1.214 ad if (ap->a_command == LFCNBMAPV)
2041 1.282 dholland error = lfs_bmapv(l, fsidp, blkiov, blkcnt);
2042 1.214 ad else /* LFCNMARKV */
2043 1.282 dholland error = lfs_markv(l, fsidp, blkiov, blkcnt);
2044 1.214 ad if (error == 0)
2045 1.214 ad error = copyout(blkiov, blkvp.blkiov,
2046 1.214 ad blkcnt * sizeof(BLOCK_INFO));
2047 1.214 ad mutex_enter(&lfs_lock);
2048 1.214 ad if (--fs->lfs_sleepers == 0)
2049 1.308 maya cv_broadcast(&fs->lfs_sleeperscv);
2050 1.214 ad mutex_exit(&lfs_lock);
2051 1.214 ad lfs_free(fs, blkiov, LFS_NB_BLKIOV);
2052 1.214 ad return error;
2053 1.92 perseant
2054 1.92 perseant case LFCNRECLAIM:
2055 1.214 ad /*
2056 1.214 ad * Flush dirops and write Ifile, allowing empty segments
2057 1.214 ad * to be immediately reclaimed.
2058 1.214 ad */
2059 1.214 ad lfs_writer_enter(fs, "pndirop");
2060 1.274 dholland off = lfs_sb_getoffset(fs);
2061 1.214 ad lfs_seglock(fs, SEGM_FORCE_CKP | SEGM_CKP);
2062 1.214 ad lfs_flush_dirops(fs);
2063 1.214 ad LFS_CLEANERINFO(cip, fs, bp);
2064 1.284 dholland oclean = lfs_ci_getclean(fs, cip);
2065 1.214 ad LFS_SYNC_CLEANERINFO(cip, fs, bp, 1);
2066 1.214 ad lfs_segwrite(ap->a_vp->v_mount, SEGM_FORCE_CKP);
2067 1.214 ad fs->lfs_sp->seg_flags |= SEGM_PROT;
2068 1.214 ad lfs_segunlock(fs);
2069 1.214 ad lfs_writer_leave(fs);
2070 1.92 perseant
2071 1.136 perseant #ifdef DEBUG
2072 1.214 ad LFS_CLEANERINFO(cip, fs, bp);
2073 1.214 ad DLOG((DLOG_CLEAN, "lfs_fcntl: reclaim wrote %" PRId64
2074 1.214 ad " blocks, cleaned %" PRId32 " segments (activesb %d)\n",
2075 1.284 dholland lfs_sb_getoffset(fs) - off,
2076 1.284 dholland lfs_ci_getclean(fs, cip) - oclean,
2077 1.214 ad fs->lfs_activesb));
2078 1.214 ad LFS_SYNC_CLEANERINFO(cip, fs, bp, 0);
2079 1.258 christos #else
2080 1.258 christos __USE(oclean);
2081 1.258 christos __USE(off);
2082 1.92 perseant #endif
2083 1.92 perseant
2084 1.214 ad return 0;
2085 1.89 perseant
2086 1.182 martin case LFCNIFILEFH_COMPAT:
2087 1.214 ad /* Return the filehandle of the Ifile */
2088 1.221 elad if ((error = kauth_authorize_system(l->l_cred,
2089 1.221 elad KAUTH_SYSTEM_FILEHANDLE, 0, NULL, NULL, NULL)) != 0)
2090 1.214 ad return (error);
2091 1.214 ad fhp = (struct fhandle *)ap->a_data;
2092 1.214 ad fhp->fh_fsid = *fsidp;
2093 1.214 ad fh_size = 16; /* former VFS_MAXFIDSIZ */
2094 1.214 ad return lfs_vptofh(fs->lfs_ivnode, &(fhp->fh_fid), &fh_size);
2095 1.182 martin
2096 1.187 martin case LFCNIFILEFH_COMPAT2:
2097 1.134 perseant case LFCNIFILEFH:
2098 1.214 ad /* Return the filehandle of the Ifile */
2099 1.214 ad fhp = (struct fhandle *)ap->a_data;
2100 1.214 ad fhp->fh_fsid = *fsidp;
2101 1.214 ad fh_size = sizeof(struct lfs_fhandle) -
2102 1.214 ad offsetof(fhandle_t, fh_fid);
2103 1.214 ad return lfs_vptofh(fs->lfs_ivnode, &(fhp->fh_fid), &fh_size);
2104 1.134 perseant
2105 1.148 perseant case LFCNREWIND:
2106 1.214 ad /* Move lfs_offset to the lowest-numbered segment */
2107 1.214 ad return lfs_rewind(fs, *(int *)ap->a_data);
2108 1.148 perseant
2109 1.148 perseant case LFCNINVAL:
2110 1.214 ad /* Mark a segment SEGUSE_INVAL */
2111 1.214 ad LFS_SEGENTRY(sup, fs, *(int *)ap->a_data, bp);
2112 1.214 ad if (sup->su_nbytes > 0) {
2113 1.214 ad brelse(bp, 0);
2114 1.214 ad lfs_unset_inval_all(fs);
2115 1.214 ad return EBUSY;
2116 1.214 ad }
2117 1.214 ad sup->su_flags |= SEGUSE_INVAL;
2118 1.236 hannken VOP_BWRITE(bp->b_vp, bp);
2119 1.214 ad return 0;
2120 1.148 perseant
2121 1.148 perseant case LFCNRESIZE:
2122 1.214 ad /* Resize the filesystem */
2123 1.214 ad return lfs_resize_fs(fs, *(int *)ap->a_data);
2124 1.148 perseant
2125 1.168 perseant case LFCNWRAPSTOP:
2126 1.179 perseant case LFCNWRAPSTOP_COMPAT:
2127 1.214 ad /*
2128 1.214 ad * Hold lfs_newseg at segment 0; if requested, sleep until
2129 1.214 ad * the filesystem wraps around. To support external agents
2130 1.214 ad * (dump, fsck-based regression test) that need to look at
2131 1.214 ad * a snapshot of the filesystem, without necessarily
2132 1.214 ad * requiring that all fs activity stops.
2133 1.214 ad */
2134 1.214 ad if (fs->lfs_stoplwp == curlwp)
2135 1.214 ad return EALREADY;
2136 1.214 ad
2137 1.214 ad mutex_enter(&lfs_lock);
2138 1.214 ad while (fs->lfs_stoplwp != NULL)
2139 1.214 ad cv_wait(&fs->lfs_stopcv, &lfs_lock);
2140 1.214 ad fs->lfs_stoplwp = curlwp;
2141 1.214 ad if (fs->lfs_nowrap == 0)
2142 1.275 dholland log(LOG_NOTICE, "%s: disabled log wrap\n",
2143 1.275 dholland lfs_sb_getfsmnt(fs));
2144 1.214 ad ++fs->lfs_nowrap;
2145 1.222 christos if (*(int *)ap->a_data == 1
2146 1.224 pooka || ap->a_command == LFCNWRAPSTOP_COMPAT) {
2147 1.214 ad log(LOG_NOTICE, "LFCNSTOPWRAP waiting for log wrap\n");
2148 1.214 ad error = mtsleep(&fs->lfs_nowrap, PCATCH | PUSER,
2149 1.214 ad "segwrap", 0, &lfs_lock);
2150 1.214 ad log(LOG_NOTICE, "LFCNSTOPWRAP done waiting\n");
2151 1.214 ad if (error) {
2152 1.214 ad lfs_wrapgo(fs, VTOI(ap->a_vp), 0);
2153 1.214 ad }
2154 1.214 ad }
2155 1.214 ad mutex_exit(&lfs_lock);
2156 1.214 ad return 0;
2157 1.168 perseant
2158 1.168 perseant case LFCNWRAPGO:
2159 1.179 perseant case LFCNWRAPGO_COMPAT:
2160 1.214 ad /*
2161 1.214 ad * Having done its work, the agent wakes up the writer.
2162 1.214 ad * If the argument is 1, it sleeps until a new segment
2163 1.214 ad * is selected.
2164 1.214 ad */
2165 1.214 ad mutex_enter(&lfs_lock);
2166 1.214 ad error = lfs_wrapgo(fs, VTOI(ap->a_vp),
2167 1.222 christos ap->a_command == LFCNWRAPGO_COMPAT ? 1 :
2168 1.222 christos *((int *)ap->a_data));
2169 1.214 ad mutex_exit(&lfs_lock);
2170 1.214 ad return error;
2171 1.168 perseant
2172 1.188 perseant case LFCNWRAPPASS:
2173 1.214 ad if ((VTOI(ap->a_vp)->i_lfs_iflags & LFSI_WRAPWAIT))
2174 1.214 ad return EALREADY;
2175 1.214 ad mutex_enter(&lfs_lock);
2176 1.214 ad if (fs->lfs_stoplwp != curlwp) {
2177 1.214 ad mutex_exit(&lfs_lock);
2178 1.214 ad return EALREADY;
2179 1.214 ad }
2180 1.214 ad if (fs->lfs_nowrap == 0) {
2181 1.214 ad mutex_exit(&lfs_lock);
2182 1.214 ad return EBUSY;
2183 1.214 ad }
2184 1.214 ad fs->lfs_wrappass = 1;
2185 1.214 ad wakeup(&fs->lfs_wrappass);
2186 1.214 ad /* Wait for the log to wrap, if asked */
2187 1.214 ad if (*(int *)ap->a_data) {
2188 1.272 hannken vref(ap->a_vp);
2189 1.214 ad VTOI(ap->a_vp)->i_lfs_iflags |= LFSI_WRAPWAIT;
2190 1.214 ad log(LOG_NOTICE, "LFCNPASS waiting for log wrap\n");
2191 1.214 ad error = mtsleep(&fs->lfs_nowrap, PCATCH | PUSER,
2192 1.214 ad "segwrap", 0, &lfs_lock);
2193 1.214 ad log(LOG_NOTICE, "LFCNPASS done waiting\n");
2194 1.214 ad VTOI(ap->a_vp)->i_lfs_iflags &= ~LFSI_WRAPWAIT;
2195 1.272 hannken vrele(ap->a_vp);
2196 1.214 ad }
2197 1.214 ad mutex_exit(&lfs_lock);
2198 1.214 ad return error;
2199 1.188 perseant
2200 1.188 perseant case LFCNWRAPSTATUS:
2201 1.214 ad mutex_enter(&lfs_lock);
2202 1.214 ad *(int *)ap->a_data = fs->lfs_wrapstatus;
2203 1.214 ad mutex_exit(&lfs_lock);
2204 1.214 ad return 0;
2205 1.188 perseant
2206 1.89 perseant default:
2207 1.245 dholland return ulfs_fcntl(v);
2208 1.89 perseant }
2209 1.89 perseant return 0;
2210 1.60 chs }
2211 1.60 chs
2212 1.84 perseant /*
2213 1.84 perseant * Return the last logical file offset that should be written for this file
2214 1.86 perseant * if we're doing a write that ends at "size". If writing, we need to know
2215 1.84 perseant * about sizes on disk, i.e. fragments if there are any; if reading, we need
2216 1.84 perseant * to know about entire blocks.
2217 1.84 perseant */
2218 1.84 perseant void
2219 1.84 perseant lfs_gop_size(struct vnode *vp, off_t size, off_t *eobp, int flags)
2220 1.84 perseant {
2221 1.84 perseant struct inode *ip = VTOI(vp);
2222 1.135 perry struct lfs *fs = ip->i_lfs;
2223 1.84 perseant daddr_t olbn, nlbn;
2224 1.84 perseant
2225 1.248 christos olbn = lfs_lblkno(fs, ip->i_size);
2226 1.248 christos nlbn = lfs_lblkno(fs, size);
2227 1.245 dholland if (!(flags & GOP_SIZE_MEM) && nlbn < ULFS_NDADDR && olbn <= nlbn) {
2228 1.248 christos *eobp = lfs_fragroundup(fs, size);
2229 1.86 perseant } else {
2230 1.248 christos *eobp = lfs_blkroundup(fs, size);
2231 1.86 perseant }
2232 1.84 perseant }
2233 1.84 perseant
#ifdef DEBUG
void lfs_dump_vop(void *);

/*
 * Debugging aid: given a vop argument block whose first member is the
 * vnode (interpreted here as vop_putpages_args), print the vnode (only
 * when DDB is configured) and then dump the inode's on-disk dinode.
 */
void
lfs_dump_vop(void *v)
{
	struct vop_putpages_args /* {
		struct vnode *a_vp;
		voff_t a_offlo;
		voff_t a_offhi;
		int a_flags;
	} */ *args = v;
	struct vnode *vp = args->a_vp;
	struct inode *node = VTOI(vp);
	struct lfs *lfsp = node->i_lfs;

#ifdef DDB
	vfs_vnode_print(vp, 0, printf);
#endif
	lfs_dump_dinode(lfsp, node->i_din);
}
#endif
2256 1.84 perseant
2257 1.84 perseant int
2258 1.84 perseant lfs_mmap(void *v)
2259 1.84 perseant {
2260 1.84 perseant struct vop_mmap_args /* {
2261 1.86 perseant const struct vnodeop_desc *a_desc;
2262 1.86 perseant struct vnode *a_vp;
2263 1.209 pooka vm_prot_t a_prot;
2264 1.176 elad kauth_cred_t a_cred;
2265 1.84 perseant } */ *ap = v;
2266 1.84 perseant
2267 1.84 perseant if (VTOI(ap->a_vp)->i_number == LFS_IFILE_INUM)
2268 1.84 perseant return EOPNOTSUPP;
2269 1.245 dholland return ulfs_mmap(v);
2270 1.84 perseant }
2271 1.254 dholland
2272 1.254 dholland static int
2273 1.254 dholland lfs_openextattr(void *v)
2274 1.254 dholland {
2275 1.254 dholland struct vop_openextattr_args /* {
2276 1.254 dholland struct vnode *a_vp;
2277 1.254 dholland kauth_cred_t a_cred;
2278 1.254 dholland struct proc *a_p;
2279 1.254 dholland } */ *ap = v;
2280 1.311 riastrad struct vnode *vp = ap->a_vp;
2281 1.311 riastrad struct inode *ip;
2282 1.311 riastrad struct ulfsmount *ump;
2283 1.311 riastrad
2284 1.311 riastrad KASSERT(VOP_ISLOCKED(vp) == LK_EXCLUSIVE);
2285 1.311 riastrad
2286 1.311 riastrad ip = VTOI(vp);
2287 1.311 riastrad ump = ip->i_ump;
2288 1.254 dholland
2289 1.254 dholland /* Not supported for ULFS1 file systems. */
2290 1.254 dholland if (ump->um_fstype == ULFS1)
2291 1.254 dholland return (EOPNOTSUPP);
2292 1.254 dholland
2293 1.254 dholland /* XXX Not implemented for ULFS2 file systems. */
2294 1.254 dholland return (EOPNOTSUPP);
2295 1.254 dholland }
2296 1.254 dholland
2297 1.254 dholland static int
2298 1.254 dholland lfs_closeextattr(void *v)
2299 1.254 dholland {
2300 1.254 dholland struct vop_closeextattr_args /* {
2301 1.254 dholland struct vnode *a_vp;
2302 1.254 dholland int a_commit;
2303 1.254 dholland kauth_cred_t a_cred;
2304 1.254 dholland struct proc *a_p;
2305 1.254 dholland } */ *ap = v;
2306 1.311 riastrad struct vnode *vp = ap->a_vp;
2307 1.311 riastrad struct inode *ip;
2308 1.311 riastrad struct ulfsmount *ump;
2309 1.311 riastrad
2310 1.311 riastrad KASSERT(VOP_ISLOCKED(vp) == LK_EXCLUSIVE);
2311 1.311 riastrad
2312 1.312 riastrad ip = VTOI(vp);
2313 1.311 riastrad ump = ip->i_ump;
2314 1.254 dholland
2315 1.254 dholland /* Not supported for ULFS1 file systems. */
2316 1.254 dholland if (ump->um_fstype == ULFS1)
2317 1.254 dholland return (EOPNOTSUPP);
2318 1.254 dholland
2319 1.254 dholland /* XXX Not implemented for ULFS2 file systems. */
2320 1.254 dholland return (EOPNOTSUPP);
2321 1.254 dholland }
2322 1.254 dholland
2323 1.254 dholland static int
2324 1.254 dholland lfs_getextattr(void *v)
2325 1.254 dholland {
2326 1.254 dholland struct vop_getextattr_args /* {
2327 1.254 dholland struct vnode *a_vp;
2328 1.254 dholland int a_attrnamespace;
2329 1.254 dholland const char *a_name;
2330 1.254 dholland struct uio *a_uio;
2331 1.254 dholland size_t *a_size;
2332 1.254 dholland kauth_cred_t a_cred;
2333 1.254 dholland struct proc *a_p;
2334 1.254 dholland } */ *ap = v;
2335 1.254 dholland struct vnode *vp = ap->a_vp;
2336 1.311 riastrad struct inode *ip;
2337 1.311 riastrad struct ulfsmount *ump;
2338 1.254 dholland int error;
2339 1.254 dholland
2340 1.311 riastrad KASSERT(VOP_ISLOCKED(vp));
2341 1.311 riastrad
2342 1.311 riastrad ip = VTOI(vp);
2343 1.311 riastrad ump = ip->i_ump;
2344 1.311 riastrad
2345 1.254 dholland if (ump->um_fstype == ULFS1) {
2346 1.254 dholland #ifdef LFS_EXTATTR
2347 1.254 dholland error = ulfs_getextattr(ap);
2348 1.254 dholland #else
2349 1.254 dholland error = EOPNOTSUPP;
2350 1.254 dholland #endif
2351 1.254 dholland return error;
2352 1.254 dholland }
2353 1.254 dholland
2354 1.254 dholland /* XXX Not implemented for ULFS2 file systems. */
2355 1.254 dholland return (EOPNOTSUPP);
2356 1.254 dholland }
2357 1.254 dholland
2358 1.254 dholland static int
2359 1.254 dholland lfs_setextattr(void *v)
2360 1.254 dholland {
2361 1.254 dholland struct vop_setextattr_args /* {
2362 1.254 dholland struct vnode *a_vp;
2363 1.254 dholland int a_attrnamespace;
2364 1.254 dholland const char *a_name;
2365 1.254 dholland struct uio *a_uio;
2366 1.254 dholland kauth_cred_t a_cred;
2367 1.254 dholland struct proc *a_p;
2368 1.254 dholland } */ *ap = v;
2369 1.254 dholland struct vnode *vp = ap->a_vp;
2370 1.311 riastrad struct inode *ip;
2371 1.311 riastrad struct ulfsmount *ump;
2372 1.254 dholland int error;
2373 1.254 dholland
2374 1.311 riastrad KASSERT(VOP_ISLOCKED(vp) == LK_EXCLUSIVE);
2375 1.311 riastrad
2376 1.311 riastrad ip = VTOI(vp);
2377 1.311 riastrad ump = ip->i_ump;
2378 1.311 riastrad
2379 1.254 dholland if (ump->um_fstype == ULFS1) {
2380 1.254 dholland #ifdef LFS_EXTATTR
2381 1.254 dholland error = ulfs_setextattr(ap);
2382 1.254 dholland #else
2383 1.254 dholland error = EOPNOTSUPP;
2384 1.254 dholland #endif
2385 1.254 dholland return error;
2386 1.254 dholland }
2387 1.254 dholland
2388 1.254 dholland /* XXX Not implemented for ULFS2 file systems. */
2389 1.254 dholland return (EOPNOTSUPP);
2390 1.254 dholland }
2391 1.254 dholland
2392 1.254 dholland static int
2393 1.254 dholland lfs_listextattr(void *v)
2394 1.254 dholland {
2395 1.254 dholland struct vop_listextattr_args /* {
2396 1.254 dholland struct vnode *a_vp;
2397 1.254 dholland int a_attrnamespace;
2398 1.254 dholland struct uio *a_uio;
2399 1.254 dholland size_t *a_size;
2400 1.254 dholland kauth_cred_t a_cred;
2401 1.254 dholland struct proc *a_p;
2402 1.254 dholland } */ *ap = v;
2403 1.254 dholland struct vnode *vp = ap->a_vp;
2404 1.311 riastrad struct inode *ip;
2405 1.311 riastrad struct ulfsmount *ump;
2406 1.254 dholland int error;
2407 1.254 dholland
2408 1.311 riastrad KASSERT(VOP_ISLOCKED(vp));
2409 1.311 riastrad
2410 1.311 riastrad ip = VTOI(vp);
2411 1.311 riastrad ump = ip->i_ump;
2412 1.311 riastrad
2413 1.254 dholland if (ump->um_fstype == ULFS1) {
2414 1.254 dholland #ifdef LFS_EXTATTR
2415 1.254 dholland error = ulfs_listextattr(ap);
2416 1.254 dholland #else
2417 1.254 dholland error = EOPNOTSUPP;
2418 1.254 dholland #endif
2419 1.254 dholland return error;
2420 1.254 dholland }
2421 1.254 dholland
2422 1.254 dholland /* XXX Not implemented for ULFS2 file systems. */
2423 1.254 dholland return (EOPNOTSUPP);
2424 1.254 dholland }
2425 1.254 dholland
2426 1.254 dholland static int
2427 1.254 dholland lfs_deleteextattr(void *v)
2428 1.254 dholland {
2429 1.254 dholland struct vop_deleteextattr_args /* {
2430 1.254 dholland struct vnode *a_vp;
2431 1.254 dholland int a_attrnamespace;
2432 1.254 dholland kauth_cred_t a_cred;
2433 1.254 dholland struct proc *a_p;
2434 1.254 dholland } */ *ap = v;
2435 1.254 dholland struct vnode *vp = ap->a_vp;
2436 1.311 riastrad struct inode *ip;
2437 1.311 riastrad struct ulfsmount *ump;
2438 1.254 dholland int error;
2439 1.254 dholland
2440 1.311 riastrad KASSERT(VOP_ISLOCKED(vp) == LK_EXCLUSIVE);
2441 1.311 riastrad
2442 1.311 riastrad ip = VTOI(vp);
2443 1.311 riastrad ump = ip->i_ump;
2444 1.311 riastrad
2445 1.254 dholland if (ump->um_fstype == ULFS1) {
2446 1.254 dholland #ifdef LFS_EXTATTR
2447 1.254 dholland error = ulfs_deleteextattr(ap);
2448 1.254 dholland #else
2449 1.254 dholland error = EOPNOTSUPP;
2450 1.254 dholland #endif
2451 1.254 dholland return error;
2452 1.254 dholland }
2453 1.254 dholland
2454 1.254 dholland /* XXX Not implemented for ULFS2 file systems. */
2455 1.254 dholland return (EOPNOTSUPP);
2456 1.254 dholland }
2457 1.299 dholland
2458