lfs_vnops.c revision 1.329 1 1.329 riastrad /* $NetBSD: lfs_vnops.c,v 1.329 2020/02/23 08:40:19 riastradh Exp $ */
2 1.2 cgd
3 1.22 perseant /*-
4 1.84 perseant * Copyright (c) 1999, 2000, 2001, 2002, 2003 The NetBSD Foundation, Inc.
5 1.22 perseant * All rights reserved.
6 1.22 perseant *
7 1.22 perseant * This code is derived from software contributed to The NetBSD Foundation
8 1.22 perseant * by Konrad E. Schroder <perseant (at) hhhh.org>.
9 1.22 perseant *
10 1.22 perseant * Redistribution and use in source and binary forms, with or without
11 1.22 perseant * modification, are permitted provided that the following conditions
12 1.22 perseant * are met:
13 1.22 perseant * 1. Redistributions of source code must retain the above copyright
14 1.22 perseant * notice, this list of conditions and the following disclaimer.
15 1.22 perseant * 2. Redistributions in binary form must reproduce the above copyright
16 1.22 perseant * notice, this list of conditions and the following disclaimer in the
17 1.22 perseant * documentation and/or other materials provided with the distribution.
18 1.22 perseant *
19 1.22 perseant * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
20 1.22 perseant * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
21 1.22 perseant * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 1.22 perseant * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
23 1.22 perseant * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24 1.22 perseant * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25 1.22 perseant * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26 1.22 perseant * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27 1.22 perseant * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28 1.22 perseant * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29 1.22 perseant * POSSIBILITY OF SUCH DAMAGE.
30 1.22 perseant */
31 1.1 mycroft /*
32 1.15 fvdl * Copyright (c) 1986, 1989, 1991, 1993, 1995
33 1.1 mycroft * The Regents of the University of California. All rights reserved.
34 1.1 mycroft *
35 1.1 mycroft * Redistribution and use in source and binary forms, with or without
36 1.1 mycroft * modification, are permitted provided that the following conditions
37 1.1 mycroft * are met:
38 1.1 mycroft * 1. Redistributions of source code must retain the above copyright
39 1.1 mycroft * notice, this list of conditions and the following disclaimer.
40 1.1 mycroft * 2. Redistributions in binary form must reproduce the above copyright
41 1.1 mycroft * notice, this list of conditions and the following disclaimer in the
42 1.1 mycroft * documentation and/or other materials provided with the distribution.
43 1.114 agc * 3. Neither the name of the University nor the names of its contributors
44 1.1 mycroft * may be used to endorse or promote products derived from this software
45 1.1 mycroft * without specific prior written permission.
46 1.1 mycroft *
47 1.1 mycroft * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
48 1.1 mycroft * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
49 1.1 mycroft * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
50 1.1 mycroft * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
51 1.1 mycroft * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
52 1.1 mycroft * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
53 1.1 mycroft * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
54 1.1 mycroft * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
55 1.1 mycroft * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
56 1.1 mycroft * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
57 1.1 mycroft * SUCH DAMAGE.
58 1.1 mycroft *
59 1.15 fvdl * @(#)lfs_vnops.c 8.13 (Berkeley) 6/10/95
60 1.1 mycroft */
61 1.58 lukem
62 1.302 dholland /* from NetBSD: ufs_vnops.c,v 1.232 2016/05/19 18:32:03 riastradh Exp */
63 1.265 dholland /*-
64 1.265 dholland * Copyright (c) 2008 The NetBSD Foundation, Inc.
65 1.265 dholland * All rights reserved.
66 1.265 dholland *
67 1.265 dholland * This code is derived from software contributed to The NetBSD Foundation
68 1.265 dholland * by Wasabi Systems, Inc.
69 1.265 dholland *
70 1.265 dholland * Redistribution and use in source and binary forms, with or without
71 1.265 dholland * modification, are permitted provided that the following conditions
72 1.265 dholland * are met:
73 1.265 dholland * 1. Redistributions of source code must retain the above copyright
74 1.265 dholland * notice, this list of conditions and the following disclaimer.
75 1.265 dholland * 2. Redistributions in binary form must reproduce the above copyright
76 1.265 dholland * notice, this list of conditions and the following disclaimer in the
77 1.265 dholland * documentation and/or other materials provided with the distribution.
78 1.265 dholland *
79 1.265 dholland * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
80 1.265 dholland * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
81 1.265 dholland * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
82 1.265 dholland * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
83 1.265 dholland * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
84 1.265 dholland * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
85 1.265 dholland * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
86 1.265 dholland * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
87 1.265 dholland * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
88 1.265 dholland * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
89 1.265 dholland * POSSIBILITY OF SUCH DAMAGE.
90 1.265 dholland */
91 1.265 dholland /*
92 1.265 dholland * Copyright (c) 1982, 1986, 1989, 1993, 1995
93 1.265 dholland * The Regents of the University of California. All rights reserved.
94 1.265 dholland * (c) UNIX System Laboratories, Inc.
95 1.265 dholland * All or some portions of this file are derived from material licensed
96 1.265 dholland * to the University of California by American Telephone and Telegraph
97 1.265 dholland * Co. or Unix System Laboratories, Inc. and are reproduced herein with
98 1.265 dholland * the permission of UNIX System Laboratories, Inc.
99 1.265 dholland *
100 1.265 dholland * Redistribution and use in source and binary forms, with or without
101 1.265 dholland * modification, are permitted provided that the following conditions
102 1.265 dholland * are met:
103 1.265 dholland * 1. Redistributions of source code must retain the above copyright
104 1.265 dholland * notice, this list of conditions and the following disclaimer.
105 1.265 dholland * 2. Redistributions in binary form must reproduce the above copyright
106 1.265 dholland * notice, this list of conditions and the following disclaimer in the
107 1.265 dholland * documentation and/or other materials provided with the distribution.
108 1.265 dholland * 3. Neither the name of the University nor the names of its contributors
109 1.265 dholland * may be used to endorse or promote products derived from this software
110 1.265 dholland * without specific prior written permission.
111 1.265 dholland *
112 1.265 dholland * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
113 1.265 dholland * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
114 1.265 dholland * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
115 1.265 dholland * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
116 1.265 dholland * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
117 1.265 dholland * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
118 1.265 dholland * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
119 1.265 dholland * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
120 1.265 dholland * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
121 1.265 dholland * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
122 1.265 dholland * SUCH DAMAGE.
123 1.265 dholland *
124 1.265 dholland * @(#)ufs_vnops.c 8.28 (Berkeley) 7/31/95
125 1.265 dholland */
126 1.265 dholland
127 1.58 lukem #include <sys/cdefs.h>
128 1.329 riastrad __KERNEL_RCSID(0, "$NetBSD: lfs_vnops.c,v 1.329 2020/02/23 08:40:19 riastradh Exp $");
129 1.182 martin
130 1.183 martin #ifdef _KERNEL_OPT
131 1.182 martin #include "opt_compat_netbsd.h"
132 1.238 chs #include "opt_uvm_page_trkown.h"
133 1.183 martin #endif
134 1.17 sommerfe
135 1.1 mycroft #include <sys/param.h>
136 1.1 mycroft #include <sys/systm.h>
137 1.1 mycroft #include <sys/namei.h>
138 1.1 mycroft #include <sys/resourcevar.h>
139 1.1 mycroft #include <sys/kernel.h>
140 1.1 mycroft #include <sys/file.h>
141 1.1 mycroft #include <sys/stat.h>
142 1.1 mycroft #include <sys/buf.h>
143 1.1 mycroft #include <sys/proc.h>
144 1.1 mycroft #include <sys/mount.h>
145 1.1 mycroft #include <sys/vnode.h>
146 1.19 thorpej #include <sys/pool.h>
147 1.10 christos #include <sys/signalvar.h>
148 1.176 elad #include <sys/kauth.h>
149 1.179 perseant #include <sys/syslog.h>
150 1.1 mycroft
151 1.12 mycroft #include <miscfs/fifofs/fifo.h>
152 1.12 mycroft #include <miscfs/genfs/genfs.h>
153 1.1 mycroft #include <miscfs/specfs/specdev.h>
154 1.1 mycroft
155 1.244 dholland #include <ufs/lfs/ulfs_inode.h>
156 1.244 dholland #include <ufs/lfs/ulfsmount.h>
157 1.244 dholland #include <ufs/lfs/ulfs_bswap.h>
158 1.244 dholland #include <ufs/lfs/ulfs_extern.h>
159 1.1 mycroft
160 1.84 perseant #include <uvm/uvm.h>
161 1.95 perseant #include <uvm/uvm_pmap.h>
162 1.95 perseant #include <uvm/uvm_stat.h>
163 1.95 perseant #include <uvm/uvm_pager.h>
164 1.84 perseant
165 1.1 mycroft #include <ufs/lfs/lfs.h>
166 1.278 dholland #include <ufs/lfs/lfs_accessors.h>
167 1.252 dholland #include <ufs/lfs/lfs_kernel.h>
168 1.1 mycroft #include <ufs/lfs/lfs_extern.h>
169 1.1 mycroft
/* Condition variable broadcast by lfs_fsync() and lfs_set_dirop() in this file. */
170 1.310 maya extern kcondvar_t lfs_writerd_cv;
/*
 * When nonzero (the default), lfs_fsync() returns immediately for
 * FSYNC_LAZY requests.  When zero, a lazy sync instead queues the inode
 * on the filesystem's lfs_pchainhd list and broadcasts lfs_writerd_cv.
 */
171 1.203 perseant int lfs_ignore_lazy_sync = 1;
172 1.203 perseant
173 1.254 dholland static int lfs_openextattr(void *v);
174 1.254 dholland static int lfs_closeextattr(void *v);
175 1.254 dholland static int lfs_getextattr(void *v);
176 1.254 dholland static int lfs_setextattr(void *v);
177 1.254 dholland static int lfs_listextattr(void *v);
178 1.254 dholland static int lfs_deleteextattr(void *v);
179 1.254 dholland
180 1.300 dholland static int lfs_makeinode(struct vattr *vap, struct vnode *,
181 1.299 dholland const struct ulfs_lookup_results *,
182 1.299 dholland struct vnode **, struct componentname *);
183 1.299 dholland
184 1.1 mycroft /* Global vfs data structures for lfs. */
/*
 * Primary LFS vnode operations vector.
 *
 * lfs_vnodeop_entries pairs each vnode operation descriptor with the
 * function that implements it; operations without an entry use the
 * vop_default_desc handler (vn_default_error).  The table is terminated
 * by a { NULL, NULL } entry.  lfs_vnodeop_opv_desc ties the table to the
 * vector pointer lfs_vnodeop_p (presumably filled in by the VFS layer at
 * initialization time -- not shown in this file section).
 */
185 1.51 perseant int (**lfs_vnodeop_p)(void *);
186 1.50 jdolecek const struct vnodeopv_entry_desc lfs_vnodeop_entries[] = {
187 1.1 mycroft { &vop_default_desc, vn_default_error },
188 1.245 dholland { &vop_lookup_desc, ulfs_lookup }, /* lookup */
189 1.22 perseant { &vop_create_desc, lfs_create }, /* create */
190 1.245 dholland { &vop_whiteout_desc, ulfs_whiteout }, /* whiteout */
191 1.22 perseant { &vop_mknod_desc, lfs_mknod }, /* mknod */
192 1.245 dholland { &vop_open_desc, ulfs_open }, /* open */
193 1.1 mycroft { &vop_close_desc, lfs_close }, /* close */
194 1.245 dholland { &vop_access_desc, ulfs_access }, /* access */
195 1.1 mycroft { &vop_getattr_desc, lfs_getattr }, /* getattr */
196 1.61 perseant { &vop_setattr_desc, lfs_setattr }, /* setattr */
197 1.1 mycroft { &vop_read_desc, lfs_read }, /* read */
198 1.1 mycroft { &vop_write_desc, lfs_write }, /* write */
199 1.269 dholland { &vop_fallocate_desc, genfs_eopnotsupp }, /* fallocate */
200 1.269 dholland { &vop_fdiscard_desc, genfs_eopnotsupp }, /* fdiscard */
201 1.245 dholland { &vop_ioctl_desc, ulfs_ioctl }, /* ioctl */
202 1.90 perseant { &vop_fcntl_desc, lfs_fcntl }, /* fcntl */
203 1.245 dholland { &vop_poll_desc, ulfs_poll }, /* poll */
204 1.68 jdolecek { &vop_kqfilter_desc, genfs_kqfilter }, /* kqfilter */
205 1.245 dholland { &vop_revoke_desc, ulfs_revoke }, /* revoke */
206 1.84 perseant { &vop_mmap_desc, lfs_mmap }, /* mmap */
207 1.1 mycroft { &vop_fsync_desc, lfs_fsync }, /* fsync */
208 1.245 dholland { &vop_seek_desc, ulfs_seek }, /* seek */
209 1.22 perseant { &vop_remove_desc, lfs_remove }, /* remove */
210 1.22 perseant { &vop_link_desc, lfs_link }, /* link */
211 1.22 perseant { &vop_rename_desc, lfs_rename }, /* rename */
212 1.22 perseant { &vop_mkdir_desc, lfs_mkdir }, /* mkdir */
213 1.22 perseant { &vop_rmdir_desc, lfs_rmdir }, /* rmdir */
214 1.22 perseant { &vop_symlink_desc, lfs_symlink }, /* symlink */
215 1.245 dholland { &vop_readdir_desc, ulfs_readdir }, /* readdir */
216 1.245 dholland { &vop_readlink_desc, ulfs_readlink }, /* readlink */
217 1.245 dholland { &vop_abortop_desc, ulfs_abortop }, /* abortop */
218 1.40 perseant { &vop_inactive_desc, lfs_inactive }, /* inactive */
219 1.1 mycroft { &vop_reclaim_desc, lfs_reclaim }, /* reclaim */
220 1.245 dholland { &vop_lock_desc, ulfs_lock }, /* lock */
221 1.245 dholland { &vop_unlock_desc, ulfs_unlock }, /* unlock */
222 1.245 dholland { &vop_bmap_desc, ulfs_bmap }, /* bmap */
223 1.94 perseant { &vop_strategy_desc, lfs_strategy }, /* strategy */
224 1.245 dholland { &vop_print_desc, ulfs_print }, /* print */
225 1.245 dholland { &vop_islocked_desc, ulfs_islocked }, /* islocked */
226 1.245 dholland { &vop_pathconf_desc, ulfs_pathconf }, /* pathconf */
227 1.245 dholland { &vop_advlock_desc, ulfs_advlock }, /* advlock */
228 1.1 mycroft { &vop_bwrite_desc, lfs_bwrite }, /* bwrite */
229 1.60 chs { &vop_getpages_desc, lfs_getpages }, /* getpages */
230 1.60 chs { &vop_putpages_desc, lfs_putpages }, /* putpages */
231 1.254 dholland { &vop_openextattr_desc, lfs_openextattr }, /* openextattr */
232 1.254 dholland { &vop_closeextattr_desc, lfs_closeextattr }, /* closeextattr */
233 1.254 dholland { &vop_getextattr_desc, lfs_getextattr }, /* getextattr */
234 1.254 dholland { &vop_setextattr_desc, lfs_setextattr }, /* setextattr */
235 1.254 dholland { &vop_listextattr_desc, lfs_listextattr }, /* listextattr */
236 1.254 dholland { &vop_deleteextattr_desc, lfs_deleteextattr }, /* deleteextattr */
237 1.53 chs { NULL, NULL }
238 1.1 mycroft };
239 1.50 jdolecek const struct vnodeopv_desc lfs_vnodeop_opv_desc =
240 1.1 mycroft { &lfs_vnodeop_p, lfs_vnodeop_entries };
241 1.1 mycroft
/*
 * LFS operations vector that routes most operations to the spec_*
 * handlers (judging by those names, this is the vector for device
 * special files -- confirm against where lfs_specop_p is installed).
 * Attribute, inactive/reclaim, locking, print and extended-attribute
 * operations still go to the lfs_ and ulfs_ implementations; bwrite
 * uses vn_bwrite here.  Terminated by { NULL, NULL }.
 */
242 1.51 perseant int (**lfs_specop_p)(void *);
243 1.50 jdolecek const struct vnodeopv_entry_desc lfs_specop_entries[] = {
244 1.1 mycroft { &vop_default_desc, vn_default_error },
245 1.1 mycroft { &vop_lookup_desc, spec_lookup }, /* lookup */
246 1.1 mycroft { &vop_create_desc, spec_create }, /* create */
247 1.1 mycroft { &vop_mknod_desc, spec_mknod }, /* mknod */
248 1.1 mycroft { &vop_open_desc, spec_open }, /* open */
249 1.65 perseant { &vop_close_desc, lfsspec_close }, /* close */
250 1.245 dholland { &vop_access_desc, ulfs_access }, /* access */
251 1.1 mycroft { &vop_getattr_desc, lfs_getattr }, /* getattr */
252 1.61 perseant { &vop_setattr_desc, lfs_setattr }, /* setattr */
253 1.245 dholland { &vop_read_desc, ulfsspec_read }, /* read */
254 1.245 dholland { &vop_write_desc, ulfsspec_write }, /* write */
255 1.269 dholland { &vop_fallocate_desc, spec_fallocate }, /* fallocate */
256 1.269 dholland { &vop_fdiscard_desc, spec_fdiscard }, /* fdiscard */
257 1.1 mycroft { &vop_ioctl_desc, spec_ioctl }, /* ioctl */
258 1.245 dholland { &vop_fcntl_desc, ulfs_fcntl }, /* fcntl */
259 1.13 mycroft { &vop_poll_desc, spec_poll }, /* poll */
260 1.68 jdolecek { &vop_kqfilter_desc, spec_kqfilter }, /* kqfilter */
261 1.15 fvdl { &vop_revoke_desc, spec_revoke }, /* revoke */
262 1.1 mycroft { &vop_mmap_desc, spec_mmap }, /* mmap */
263 1.1 mycroft { &vop_fsync_desc, spec_fsync }, /* fsync */
264 1.1 mycroft { &vop_seek_desc, spec_seek }, /* seek */
265 1.1 mycroft { &vop_remove_desc, spec_remove }, /* remove */
266 1.1 mycroft { &vop_link_desc, spec_link }, /* link */
267 1.1 mycroft { &vop_rename_desc, spec_rename }, /* rename */
268 1.1 mycroft { &vop_mkdir_desc, spec_mkdir }, /* mkdir */
269 1.1 mycroft { &vop_rmdir_desc, spec_rmdir }, /* rmdir */
270 1.1 mycroft { &vop_symlink_desc, spec_symlink }, /* symlink */
271 1.1 mycroft { &vop_readdir_desc, spec_readdir }, /* readdir */
272 1.1 mycroft { &vop_readlink_desc, spec_readlink }, /* readlink */
273 1.1 mycroft { &vop_abortop_desc, spec_abortop }, /* abortop */
274 1.40 perseant { &vop_inactive_desc, lfs_inactive }, /* inactive */
275 1.1 mycroft { &vop_reclaim_desc, lfs_reclaim }, /* reclaim */
276 1.245 dholland { &vop_lock_desc, ulfs_lock }, /* lock */
277 1.245 dholland { &vop_unlock_desc, ulfs_unlock }, /* unlock */
278 1.1 mycroft { &vop_bmap_desc, spec_bmap }, /* bmap */
279 1.1 mycroft { &vop_strategy_desc, spec_strategy }, /* strategy */
280 1.245 dholland { &vop_print_desc, ulfs_print }, /* print */
281 1.245 dholland { &vop_islocked_desc, ulfs_islocked }, /* islocked */
282 1.1 mycroft { &vop_pathconf_desc, spec_pathconf }, /* pathconf */
283 1.1 mycroft { &vop_advlock_desc, spec_advlock }, /* advlock */
284 1.28 perseant { &vop_bwrite_desc, vn_bwrite }, /* bwrite */
285 1.53 chs { &vop_getpages_desc, spec_getpages }, /* getpages */
286 1.53 chs { &vop_putpages_desc, spec_putpages }, /* putpages */
287 1.254 dholland { &vop_openextattr_desc, lfs_openextattr }, /* openextattr */
288 1.254 dholland { &vop_closeextattr_desc, lfs_closeextattr }, /* closeextattr */
289 1.254 dholland { &vop_getextattr_desc, lfs_getextattr }, /* getextattr */
290 1.254 dholland { &vop_setextattr_desc, lfs_setextattr }, /* setextattr */
291 1.254 dholland { &vop_listextattr_desc, lfs_listextattr }, /* listextattr */
292 1.254 dholland { &vop_deleteextattr_desc, lfs_deleteextattr }, /* deleteextattr */
293 1.53 chs { NULL, NULL }
294 1.1 mycroft };
295 1.50 jdolecek const struct vnodeopv_desc lfs_specop_opv_desc =
296 1.1 mycroft { &lfs_specop_p, lfs_specop_entries };
297 1.1 mycroft
/*
 * LFS operations vector that routes most operations through
 * vn_fifo_bypass (judging by that name, this is the vector for FIFOs --
 * confirm against where lfs_fifoop_p is installed).  Close, read and
 * write use the lfsfifo_/ulfsfifo_ wrappers; attribute,
 * inactive/reclaim, locking, print, bwrite and extended-attribute
 * operations go to the lfs_ and ulfs_ implementations.  There is no
 * getpages entry, so that operation falls through to the default
 * handler.  Terminated by { NULL, NULL }.
 */
298 1.51 perseant int (**lfs_fifoop_p)(void *);
299 1.50 jdolecek const struct vnodeopv_entry_desc lfs_fifoop_entries[] = {
300 1.1 mycroft { &vop_default_desc, vn_default_error },
301 1.227 pooka { &vop_lookup_desc, vn_fifo_bypass }, /* lookup */
302 1.227 pooka { &vop_create_desc, vn_fifo_bypass }, /* create */
303 1.227 pooka { &vop_mknod_desc, vn_fifo_bypass }, /* mknod */
304 1.227 pooka { &vop_open_desc, vn_fifo_bypass }, /* open */
305 1.65 perseant { &vop_close_desc, lfsfifo_close }, /* close */
306 1.245 dholland { &vop_access_desc, ulfs_access }, /* access */
307 1.1 mycroft { &vop_getattr_desc, lfs_getattr }, /* getattr */
308 1.61 perseant { &vop_setattr_desc, lfs_setattr }, /* setattr */
309 1.245 dholland { &vop_read_desc, ulfsfifo_read }, /* read */
310 1.245 dholland { &vop_write_desc, ulfsfifo_write }, /* write */
311 1.269 dholland { &vop_fallocate_desc, vn_fifo_bypass }, /* fallocate */
312 1.269 dholland { &vop_fdiscard_desc, vn_fifo_bypass }, /* fdiscard */
313 1.227 pooka { &vop_ioctl_desc, vn_fifo_bypass }, /* ioctl */
314 1.245 dholland { &vop_fcntl_desc, ulfs_fcntl }, /* fcntl */
315 1.227 pooka { &vop_poll_desc, vn_fifo_bypass }, /* poll */
316 1.227 pooka { &vop_kqfilter_desc, vn_fifo_bypass }, /* kqfilter */
317 1.227 pooka { &vop_revoke_desc, vn_fifo_bypass }, /* revoke */
318 1.227 pooka { &vop_mmap_desc, vn_fifo_bypass }, /* mmap */
319 1.227 pooka { &vop_fsync_desc, vn_fifo_bypass }, /* fsync */
320 1.227 pooka { &vop_seek_desc, vn_fifo_bypass }, /* seek */
321 1.227 pooka { &vop_remove_desc, vn_fifo_bypass }, /* remove */
322 1.227 pooka { &vop_link_desc, vn_fifo_bypass }, /* link */
323 1.227 pooka { &vop_rename_desc, vn_fifo_bypass }, /* rename */
324 1.227 pooka { &vop_mkdir_desc, vn_fifo_bypass }, /* mkdir */
325 1.227 pooka { &vop_rmdir_desc, vn_fifo_bypass }, /* rmdir */
326 1.227 pooka { &vop_symlink_desc, vn_fifo_bypass }, /* symlink */
327 1.227 pooka { &vop_readdir_desc, vn_fifo_bypass }, /* readdir */
328 1.227 pooka { &vop_readlink_desc, vn_fifo_bypass }, /* readlink */
329 1.227 pooka { &vop_abortop_desc, vn_fifo_bypass }, /* abortop */
330 1.40 perseant { &vop_inactive_desc, lfs_inactive }, /* inactive */
331 1.1 mycroft { &vop_reclaim_desc, lfs_reclaim }, /* reclaim */
332 1.245 dholland { &vop_lock_desc, ulfs_lock }, /* lock */
333 1.245 dholland { &vop_unlock_desc, ulfs_unlock }, /* unlock */
334 1.227 pooka { &vop_bmap_desc, vn_fifo_bypass }, /* bmap */
335 1.227 pooka { &vop_strategy_desc, vn_fifo_bypass }, /* strategy */
336 1.245 dholland { &vop_print_desc, ulfs_print }, /* print */
337 1.245 dholland { &vop_islocked_desc, ulfs_islocked }, /* islocked */
338 1.227 pooka { &vop_pathconf_desc, vn_fifo_bypass }, /* pathconf */
339 1.227 pooka { &vop_advlock_desc, vn_fifo_bypass }, /* advlock */
340 1.1 mycroft { &vop_bwrite_desc, lfs_bwrite }, /* bwrite */
341 1.227 pooka { &vop_putpages_desc, vn_fifo_bypass }, /* putpages */
342 1.254 dholland { &vop_openextattr_desc, lfs_openextattr }, /* openextattr */
343 1.254 dholland { &vop_closeextattr_desc, lfs_closeextattr }, /* closeextattr */
344 1.254 dholland { &vop_getextattr_desc, lfs_getextattr }, /* getextattr */
345 1.254 dholland { &vop_setextattr_desc, lfs_setextattr }, /* setextattr */
346 1.254 dholland { &vop_listextattr_desc, lfs_listextattr }, /* listextattr */
347 1.254 dholland { &vop_deleteextattr_desc, lfs_deleteextattr }, /* deleteextattr */
348 1.53 chs { NULL, NULL }
349 1.1 mycroft };
350 1.50 jdolecek const struct vnodeopv_desc lfs_fifoop_opv_desc =
351 1.1 mycroft { &lfs_fifoop_p, lfs_fifoop_entries };
352 1.1 mycroft
353 1.244 dholland #include <ufs/lfs/ulfs_readwrite.c>
354 1.1 mycroft
355 1.1 mycroft /*
356 1.299 dholland * Allocate a new inode.
357 1.299 dholland */
358 1.299 dholland static int
359 1.300 dholland lfs_makeinode(struct vattr *vap, struct vnode *dvp,
360 1.299 dholland const struct ulfs_lookup_results *ulr,
361 1.299 dholland struct vnode **vpp, struct componentname *cnp)
362 1.299 dholland {
363 1.299 dholland struct inode *ip;
364 1.299 dholland struct vnode *tvp;
365 1.299 dholland int error;
366 1.299 dholland
367 1.323 hannken error = vcache_new(dvp->v_mount, dvp, vap, cnp->cn_cred, NULL, &tvp);
368 1.299 dholland if (error)
369 1.299 dholland return error;
370 1.299 dholland error = vn_lock(tvp, LK_EXCLUSIVE);
371 1.299 dholland if (error) {
372 1.299 dholland vrele(tvp);
373 1.299 dholland return error;
374 1.299 dholland }
375 1.319 maya MARK_VNODE(tvp);
376 1.299 dholland *vpp = tvp;
377 1.299 dholland ip = VTOI(tvp);
378 1.317 maya ip->i_state |= IN_ACCESS | IN_CHANGE | IN_UPDATE;
379 1.299 dholland ip->i_nlink = 1;
380 1.299 dholland DIP_ASSIGN(ip, nlink, 1);
381 1.299 dholland
382 1.299 dholland /* Authorize setting SGID if needed. */
383 1.299 dholland if (ip->i_mode & ISGID) {
384 1.299 dholland error = kauth_authorize_vnode(cnp->cn_cred, KAUTH_VNODE_WRITE_SECURITY,
385 1.299 dholland tvp, NULL, genfs_can_chmod(tvp->v_type, cnp->cn_cred, ip->i_uid,
386 1.299 dholland ip->i_gid, MAKEIMODE(vap->va_type, vap->va_mode)));
387 1.299 dholland if (error) {
388 1.299 dholland ip->i_mode &= ~ISGID;
389 1.299 dholland DIP_ASSIGN(ip, mode, ip->i_mode);
390 1.299 dholland }
391 1.299 dholland }
392 1.299 dholland
393 1.299 dholland if (cnp->cn_flags & ISWHITEOUT) {
394 1.299 dholland ip->i_flags |= UF_OPAQUE;
395 1.299 dholland DIP_ASSIGN(ip, flags, ip->i_flags);
396 1.299 dholland }
397 1.299 dholland
398 1.299 dholland /*
399 1.299 dholland * Make sure inode goes to disk before directory entry.
400 1.299 dholland */
401 1.299 dholland if ((error = lfs_update(tvp, NULL, NULL, UPDATE_DIROP)) != 0)
402 1.299 dholland goto bad;
403 1.299 dholland error = ulfs_direnter(dvp, ulr, tvp,
404 1.299 dholland cnp, ip->i_number, LFS_IFTODT(ip->i_mode), NULL);
405 1.299 dholland if (error)
406 1.299 dholland goto bad;
407 1.299 dholland *vpp = tvp;
408 1.325 christos cache_enter(dvp, *vpp, cnp->cn_nameptr, cnp->cn_namelen, cnp->cn_flags);
409 1.311 riastrad KASSERT(VOP_ISLOCKED(*vpp) == LK_EXCLUSIVE);
410 1.299 dholland return (0);
411 1.299 dholland
412 1.299 dholland bad:
413 1.299 dholland /*
414 1.299 dholland * Write error occurred trying to update the inode
415 1.299 dholland * or the directory so must deallocate the inode.
416 1.299 dholland */
417 1.299 dholland ip->i_nlink = 0;
418 1.299 dholland DIP_ASSIGN(ip, nlink, 0);
419 1.317 maya ip->i_state |= IN_CHANGE;
420 1.299 dholland /* If IN_ADIROP, account for it */
421 1.319 maya UNMARK_VNODE(tvp);
422 1.299 dholland vput(tvp);
423 1.299 dholland return (error);
424 1.299 dholland }
425 1.299 dholland
426 1.299 dholland /*
427 1.1 mycroft * Synch an open file.
428 1.1 mycroft */
429 1.1 mycroft /* ARGSUSED */
430 1.10 christos int
431 1.51 perseant lfs_fsync(void *v)
432 1.10 christos {
433 1.1 mycroft struct vop_fsync_args /* {
434 1.1 mycroft struct vnode *a_vp;
435 1.176 elad kauth_cred_t a_cred;
436 1.22 perseant int a_flags;
437 1.49 toshii off_t offlo;
438 1.49 toshii off_t offhi;
439 1.10 christos } */ *ap = v;
440 1.60 chs struct vnode *vp = ap->a_vp;
441 1.311 riastrad int wait;
442 1.203 perseant struct inode *ip = VTOI(vp);
443 1.203 perseant struct lfs *fs = ip->i_lfs;
444 1.311 riastrad int error = 0;
445 1.311 riastrad
446 1.311 riastrad KASSERT(VOP_ISLOCKED(vp) == LK_EXCLUSIVE);
447 1.84 perseant
448 1.161 perseant /* If we're mounted read-only, don't try to sync. */
449 1.203 perseant if (fs->lfs_ronly)
450 1.311 riastrad goto out;
451 1.161 perseant
452 1.231 hannken /* If a removed vnode is being cleaned, no need to sync here. */
453 1.231 hannken if ((ap->a_flags & FSYNC_RECLAIM) != 0 && ip->i_mode == 0)
454 1.311 riastrad goto out;
455 1.231 hannken
456 1.86 perseant /*
457 1.203 perseant * Trickle sync simply adds this vnode to the pager list, as if
458 1.203 perseant * the pagedaemon had requested a pageout.
459 1.86 perseant */
460 1.84 perseant if (ap->a_flags & FSYNC_LAZY) {
461 1.203 perseant if (lfs_ignore_lazy_sync == 0) {
462 1.214 ad mutex_enter(&lfs_lock);
463 1.317 maya if (!(ip->i_state & IN_PAGING)) {
464 1.317 maya ip->i_state |= IN_PAGING;
465 1.203 perseant TAILQ_INSERT_TAIL(&fs->lfs_pchainhd, ip,
466 1.203 perseant i_lfs_pchain);
467 1.203 perseant }
468 1.310 maya cv_broadcast(&lfs_writerd_cv);
469 1.214 ad mutex_exit(&lfs_lock);
470 1.203 perseant }
471 1.311 riastrad goto out;
472 1.84 perseant }
473 1.47 perseant
474 1.175 perseant /*
475 1.321 maya * If a vnode is being cleaned, flush it out before we try to
476 1.188 perseant * reuse it. This prevents the cleaner from writing files twice
477 1.188 perseant * in the same partial segment, causing an accounting underflow.
478 1.188 perseant */
479 1.317 maya if (ap->a_flags & FSYNC_RECLAIM && ip->i_state & IN_CLEANING) {
480 1.188 perseant lfs_vflush(vp);
481 1.175 perseant }
482 1.175 perseant
483 1.84 perseant wait = (ap->a_flags & FSYNC_WAIT);
484 1.203 perseant do {
485 1.235 rmind mutex_enter(vp->v_interlock);
486 1.203 perseant error = VOP_PUTPAGES(vp, trunc_page(ap->a_offlo),
487 1.203 perseant round_page(ap->a_offhi),
488 1.203 perseant PGO_CLEANIT | (wait ? PGO_SYNCIO : 0));
489 1.205 perseant if (error == EAGAIN) {
490 1.214 ad mutex_enter(&lfs_lock);
491 1.274 dholland mtsleep(&fs->lfs_availsleep, PCATCH | PUSER,
492 1.274 dholland "lfs_fsync", hz / 100 + 1, &lfs_lock);
493 1.214 ad mutex_exit(&lfs_lock);
494 1.205 perseant }
495 1.203 perseant } while (error == EAGAIN);
496 1.103 perseant if (error)
497 1.311 riastrad goto out;
498 1.203 perseant
499 1.203 perseant if ((ap->a_flags & FSYNC_DATAONLY) == 0)
500 1.203 perseant error = lfs_update(vp, NULL, NULL, wait ? UPDATE_WAIT : 0);
501 1.203 perseant
502 1.133 wrstuden if (error == 0 && ap->a_flags & FSYNC_CACHE) {
503 1.133 wrstuden int l = 0;
504 1.203 perseant error = VOP_IOCTL(ip->i_devvp, DIOCCACHESYNC, &l, FWRITE,
505 1.213 pooka curlwp->l_cred);
506 1.133 wrstuden }
507 1.103 perseant if (wait && !VPISEMPTY(vp))
508 1.203 perseant LFS_SET_UINO(ip, IN_MODIFIED);
509 1.84 perseant
510 1.311 riastrad out:
511 1.311 riastrad KASSERT(VOP_ISLOCKED(vp) == LK_EXCLUSIVE);
512 1.63 perseant return error;
513 1.1 mycroft }
514 1.1 mycroft
515 1.1 mycroft /*
516 1.245 dholland * Take IN_ADIROP off, then call ulfs_inactive.
517 1.40 perseant */
518 1.40 perseant int
519 1.51 perseant lfs_inactive(void *v)
520 1.40 perseant {
521 1.313 riastrad struct vop_inactive_v2_args /* {
522 1.40 perseant struct vnode *a_vp;
523 1.313 riastrad bool *a_recycle;
524 1.40 perseant } */ *ap = v;
525 1.72 yamt
526 1.311 riastrad KASSERT(VOP_ISLOCKED(ap->a_vp) == LK_EXCLUSIVE);
527 1.311 riastrad
528 1.319 maya UNMARK_VNODE(ap->a_vp);
529 1.76 yamt
530 1.97 perseant /*
531 1.97 perseant * The Ifile is only ever inactivated on unmount.
532 1.97 perseant * Streamline this process by not giving it more dirty blocks.
533 1.97 perseant */
534 1.97 perseant if (VTOI(ap->a_vp)->i_number == LFS_IFILE_INUM) {
535 1.214 ad mutex_enter(&lfs_lock);
536 1.97 perseant LFS_CLR_UINO(VTOI(ap->a_vp), IN_ALLMOD);
537 1.214 ad mutex_exit(&lfs_lock);
538 1.97 perseant return 0;
539 1.97 perseant }
540 1.97 perseant
541 1.239 perseant #ifdef DEBUG
542 1.239 perseant /*
543 1.239 perseant * This might happen on unmount.
544 1.239 perseant * XXX If it happens at any other time, it should be a panic.
545 1.239 perseant */
546 1.239 perseant if (ap->a_vp->v_uflag & VU_DIROP) {
547 1.239 perseant struct inode *ip = VTOI(ap->a_vp);
548 1.306 maya printf("lfs_inactive: inactivating VU_DIROP? ino = %llu\n",
549 1.306 maya (unsigned long long) ip->i_number);
550 1.239 perseant }
551 1.239 perseant #endif /* DIAGNOSTIC */
552 1.239 perseant
553 1.245 dholland return ulfs_inactive(v);
554 1.40 perseant }
555 1.40 perseant
556 1.249 dholland int
557 1.138 perseant lfs_set_dirop(struct vnode *dvp, struct vnode *vp)
558 1.40 perseant {
559 1.24 perseant struct lfs *fs;
560 1.24 perseant int error;
561 1.24 perseant
562 1.311 riastrad KASSERT(VOP_ISLOCKED(dvp) == LK_EXCLUSIVE);
563 1.311 riastrad KASSERT(vp == NULL || VOP_ISLOCKED(vp) == LK_EXCLUSIVE);
564 1.71 yamt
565 1.138 perseant fs = VTOI(dvp)->i_lfs;
566 1.141 perseant
567 1.141 perseant ASSERT_NO_SEGLOCK(fs);
568 1.44 perseant /*
569 1.134 perseant * LFS_NRESERVE calculates direct and indirect blocks as well
570 1.134 perseant * as an inode block; an overestimate in most cases.
571 1.44 perseant */
572 1.138 perseant if ((error = lfs_reserve(fs, dvp, vp, LFS_NRESERVE(fs))) != 0)
573 1.44 perseant return (error);
574 1.70 yamt
575 1.214 ad restart:
576 1.214 ad mutex_enter(&lfs_lock);
577 1.141 perseant if (fs->lfs_dirops == 0) {
578 1.214 ad mutex_exit(&lfs_lock);
579 1.138 perseant lfs_check(dvp, LFS_UNUSED_LBN, 0);
580 1.214 ad mutex_enter(&lfs_lock);
581 1.113 yamt }
582 1.190 perseant while (fs->lfs_writer) {
583 1.309 maya error = cv_wait_sig(&fs->lfs_diropscv, &lfs_lock);
584 1.190 perseant if (error == EINTR) {
585 1.214 ad mutex_exit(&lfs_lock);
586 1.190 perseant goto unreserve;
587 1.190 perseant }
588 1.190 perseant }
589 1.113 yamt if (lfs_dirvcount > LFS_MAX_DIROP && fs->lfs_dirops == 0) {
590 1.310 maya cv_broadcast(&lfs_writerd_cv);
591 1.214 ad mutex_exit(&lfs_lock);
592 1.198 ad preempt();
593 1.113 yamt goto restart;
594 1.113 yamt }
595 1.33 perseant
596 1.113 yamt if (lfs_dirvcount > LFS_MAX_DIROP) {
597 1.136 perseant DLOG((DLOG_DIROP, "lfs_set_dirop: sleeping with dirops=%d, "
598 1.136 perseant "dirvcount=%d\n", fs->lfs_dirops, lfs_dirvcount));
599 1.214 ad if ((error = mtsleep(&lfs_dirvcount,
600 1.214 ad PCATCH | PUSER | PNORELOCK, "lfs_maxdirop", 0,
601 1.214 ad &lfs_lock)) != 0) {
602 1.304 maya mutex_exit(&lfs_lock);
603 1.113 yamt goto unreserve;
604 1.113 yamt }
605 1.304 maya mutex_exit(&lfs_lock);
606 1.113 yamt goto restart;
607 1.135 perry }
608 1.113 yamt
609 1.135 perry ++fs->lfs_dirops;
610 1.239 perseant /* fs->lfs_doifile = 1; */ /* XXX why? --ks */
611 1.214 ad mutex_exit(&lfs_lock);
612 1.24 perseant
613 1.46 perseant /* Hold a reference so SET_ENDOP will be happy */
614 1.138 perseant vref(dvp);
615 1.138 perseant if (vp) {
616 1.138 perseant vref(vp);
617 1.138 perseant MARK_VNODE(vp);
618 1.138 perseant }
619 1.46 perseant
620 1.138 perseant MARK_VNODE(dvp);
621 1.24 perseant return 0;
622 1.70 yamt
623 1.203 perseant unreserve:
624 1.138 perseant lfs_reserve(fs, dvp, vp, -LFS_NRESERVE(fs));
625 1.70 yamt return error;
626 1.1 mycroft }
627 1.1 mycroft
628 1.138 perseant /*
629 1.264 dholland * Opposite of lfs_set_dirop... mostly. For now at least must call
630 1.264 dholland * UNMARK_VNODE(dvp) explicitly first. (XXX: clean that up)
631 1.138 perseant */
632 1.264 dholland void
633 1.264 dholland lfs_unset_dirop(struct lfs *fs, struct vnode *dvp, const char *str)
634 1.138 perseant {
635 1.264 dholland mutex_enter(&lfs_lock);
636 1.264 dholland --fs->lfs_dirops;
637 1.264 dholland if (!fs->lfs_dirops) {
638 1.264 dholland if (fs->lfs_nadirop) {
639 1.264 dholland panic("lfs_unset_dirop: %s: no dirops but "
640 1.264 dholland " nadirop=%d", str,
641 1.264 dholland fs->lfs_nadirop);
642 1.264 dholland }
643 1.264 dholland wakeup(&fs->lfs_writer);
644 1.264 dholland mutex_exit(&lfs_lock);
645 1.264 dholland lfs_check(dvp, LFS_UNUSED_LBN, 0);
646 1.264 dholland } else {
647 1.264 dholland mutex_exit(&lfs_lock);
648 1.138 perseant }
649 1.264 dholland lfs_reserve(fs, dvp, NULL, -LFS_NRESERVE(fs));
650 1.1 mycroft }
651 1.1 mycroft
652 1.117 yamt void
653 1.117 yamt lfs_mark_vnode(struct vnode *vp)
654 1.117 yamt {
655 1.117 yamt struct inode *ip = VTOI(vp);
656 1.117 yamt struct lfs *fs = ip->i_lfs;
657 1.37 perseant
658 1.214 ad mutex_enter(&lfs_lock);
659 1.317 maya if (!(ip->i_state & IN_ADIROP)) {
660 1.212 ad if (!(vp->v_uflag & VU_DIROP)) {
661 1.240 perseant mutex_exit(&lfs_lock);
662 1.272 hannken vref(vp);
663 1.240 perseant mutex_enter(&lfs_lock);
664 1.117 yamt ++lfs_dirvcount;
665 1.173 perseant ++fs->lfs_dirvcount;
666 1.117 yamt TAILQ_INSERT_TAIL(&fs->lfs_dchainhd, ip, i_lfs_dchain);
667 1.212 ad vp->v_uflag |= VU_DIROP;
668 1.117 yamt }
669 1.117 yamt ++fs->lfs_nadirop;
670 1.317 maya ip->i_state &= ~IN_CDIROP;
671 1.317 maya ip->i_state |= IN_ADIROP;
672 1.117 yamt } else
673 1.212 ad KASSERT(vp->v_uflag & VU_DIROP);
674 1.214 ad mutex_exit(&lfs_lock);
675 1.117 yamt }
676 1.40 perseant
677 1.117 yamt void
678 1.117 yamt lfs_unmark_vnode(struct vnode *vp)
679 1.40 perseant {
680 1.117 yamt struct inode *ip = VTOI(vp);
681 1.40 perseant
682 1.240 perseant mutex_enter(&lfs_lock);
683 1.317 maya if (ip && (ip->i_state & IN_ADIROP)) {
684 1.212 ad KASSERT(vp->v_uflag & VU_DIROP);
685 1.40 perseant --ip->i_lfs->lfs_nadirop;
686 1.317 maya ip->i_state &= ~IN_ADIROP;
687 1.117 yamt }
688 1.240 perseant mutex_exit(&lfs_lock);
689 1.40 perseant }
690 1.15 fvdl
691 1.1 mycroft int
692 1.51 perseant lfs_symlink(void *v)
693 1.10 christos {
694 1.261 hannken struct vop_symlink_v3_args /* {
695 1.1 mycroft struct vnode *a_dvp;
696 1.1 mycroft struct vnode **a_vpp;
697 1.1 mycroft struct componentname *a_cnp;
698 1.1 mycroft struct vattr *a_vap;
699 1.1 mycroft char *a_target;
700 1.10 christos } */ *ap = v;
701 1.264 dholland struct lfs *fs;
702 1.264 dholland struct vnode *dvp, **vpp;
703 1.266 dholland struct inode *ip;
704 1.266 dholland struct ulfs_lookup_results *ulr;
705 1.266 dholland ssize_t len; /* XXX should be size_t */
706 1.37 perseant int error;
707 1.1 mycroft
708 1.264 dholland dvp = ap->a_dvp;
709 1.264 dholland vpp = ap->a_vpp;
710 1.264 dholland
711 1.311 riastrad KASSERT(VOP_ISLOCKED(dvp) == LK_EXCLUSIVE);
712 1.264 dholland KASSERT(vpp != NULL);
713 1.264 dholland KASSERT(*vpp == NULL);
714 1.272 hannken KASSERT(ap->a_vap->va_type == VLNK);
715 1.264 dholland
716 1.266 dholland /* XXX should handle this material another way */
717 1.266 dholland ulr = &VTOI(ap->a_dvp)->i_crap;
718 1.266 dholland ULFS_CHECK_CRAPCOUNTER(VTOI(ap->a_dvp));
719 1.266 dholland
720 1.264 dholland fs = VFSTOULFS(dvp->v_mount)->um_lfs;
721 1.264 dholland ASSERT_NO_SEGLOCK(fs);
722 1.264 dholland if (fs->lfs_ronly) {
723 1.264 dholland return EROFS;
724 1.264 dholland }
725 1.264 dholland
726 1.264 dholland error = lfs_set_dirop(dvp, NULL);
727 1.272 hannken if (error)
728 1.37 perseant return error;
729 1.264 dholland
730 1.300 dholland error = lfs_makeinode(ap->a_vap, dvp, ulr, vpp, ap->a_cnp);
731 1.266 dholland if (error) {
732 1.266 dholland goto out;
733 1.266 dholland }
734 1.311 riastrad KASSERT(VOP_ISLOCKED(*vpp) == LK_EXCLUSIVE);
735 1.266 dholland
736 1.266 dholland VN_KNOTE(ap->a_dvp, NOTE_WRITE);
737 1.266 dholland ip = VTOI(*vpp);
738 1.266 dholland
739 1.294 dholland /*
740 1.294 dholland * This test is off by one. um_maxsymlinklen contains the
741 1.294 dholland * number of bytes available, and we aren't storing a \0, so
742 1.294 dholland * the test should properly be <=. However, it cannot be
743 1.294 dholland * changed as this would break compatibility with existing fs
744 1.294 dholland * images -- see the way ulfs_readlink() works.
745 1.294 dholland */
746 1.266 dholland len = strlen(ap->a_target);
747 1.266 dholland if (len < ip->i_lfs->um_maxsymlinklen) {
748 1.266 dholland memcpy((char *)SHORTLINK(ip), ap->a_target, len);
749 1.266 dholland ip->i_size = len;
750 1.266 dholland DIP_ASSIGN(ip, size, len);
751 1.266 dholland uvm_vnp_setsize(*vpp, ip->i_size);
752 1.317 maya ip->i_state |= IN_CHANGE | IN_UPDATE;
753 1.266 dholland if ((*vpp)->v_mount->mnt_flag & MNT_RELATIME)
754 1.317 maya ip->i_state |= IN_ACCESS;
755 1.266 dholland } else {
756 1.270 riastrad error = ulfs_bufio(UIO_WRITE, *vpp, ap->a_target, len, (off_t)0,
757 1.270 riastrad IO_NODELOCKED | IO_JOURNALLOCKED, ap->a_cnp->cn_cred, NULL,
758 1.270 riastrad NULL);
759 1.266 dholland }
760 1.266 dholland
761 1.266 dholland VOP_UNLOCK(*vpp);
762 1.266 dholland if (error)
763 1.266 dholland vrele(*vpp);
764 1.266 dholland
765 1.266 dholland out:
766 1.264 dholland UNMARK_VNODE(dvp);
767 1.264 dholland /* XXX: is it even possible for the symlink to get MARK'd? */
768 1.264 dholland UNMARK_VNODE(*vpp);
769 1.281 dholland if (error) {
770 1.264 dholland *vpp = NULL;
771 1.264 dholland }
772 1.264 dholland lfs_unset_dirop(fs, dvp, "symlink");
773 1.264 dholland
774 1.264 dholland vrele(dvp);
775 1.37 perseant return (error);
776 1.1 mycroft }
777 1.1 mycroft
778 1.1 mycroft int
779 1.51 perseant lfs_mknod(void *v)
780 1.10 christos {
781 1.261 hannken struct vop_mknod_v3_args /* {
782 1.1 mycroft struct vnode *a_dvp;
783 1.1 mycroft struct vnode **a_vpp;
784 1.1 mycroft struct componentname *a_cnp;
785 1.1 mycroft struct vattr *a_vap;
786 1.203 perseant } */ *ap = v;
787 1.264 dholland struct lfs *fs;
788 1.264 dholland struct vnode *dvp, **vpp;
789 1.250 dholland struct vattr *vap;
790 1.86 perseant struct inode *ip;
791 1.86 perseant int error;
792 1.52 assar ino_t ino;
793 1.245 dholland struct ulfs_lookup_results *ulr;
794 1.237 dholland
795 1.264 dholland dvp = ap->a_dvp;
796 1.264 dholland vpp = ap->a_vpp;
797 1.250 dholland vap = ap->a_vap;
798 1.250 dholland
799 1.311 riastrad KASSERT(VOP_ISLOCKED(dvp) == LK_EXCLUSIVE);
800 1.264 dholland KASSERT(vpp != NULL);
801 1.264 dholland KASSERT(*vpp == NULL);
802 1.311 riastrad
803 1.237 dholland /* XXX should handle this material another way */
804 1.264 dholland ulr = &VTOI(dvp)->i_crap;
805 1.264 dholland ULFS_CHECK_CRAPCOUNTER(VTOI(dvp));
806 1.264 dholland
807 1.264 dholland fs = VFSTOULFS(dvp->v_mount)->um_lfs;
808 1.264 dholland ASSERT_NO_SEGLOCK(fs);
809 1.264 dholland if (fs->lfs_ronly) {
810 1.264 dholland return EROFS;
811 1.264 dholland }
812 1.264 dholland
813 1.264 dholland error = lfs_set_dirop(dvp, NULL);
814 1.272 hannken if (error)
815 1.28 perseant return error;
816 1.250 dholland
817 1.300 dholland error = lfs_makeinode(vap, dvp, ulr, vpp, ap->a_cnp);
818 1.28 perseant
819 1.28 perseant /* Either way we're done with the dirop at this point */
820 1.264 dholland UNMARK_VNODE(dvp);
821 1.264 dholland UNMARK_VNODE(*vpp);
822 1.264 dholland lfs_unset_dirop(fs, dvp, "mknod");
823 1.28 perseant
824 1.250 dholland if (error) {
825 1.303 dholland vrele(dvp);
826 1.250 dholland *vpp = NULL;
827 1.28 perseant return (error);
828 1.250 dholland }
829 1.311 riastrad KASSERT(VOP_ISLOCKED(*vpp) == LK_EXCLUSIVE);
830 1.28 perseant
831 1.264 dholland VN_KNOTE(dvp, NOTE_WRITE);
832 1.86 perseant ip = VTOI(*vpp);
833 1.52 assar ino = ip->i_number;
834 1.317 maya ip->i_state |= IN_ACCESS | IN_CHANGE | IN_UPDATE;
835 1.134 perseant
836 1.28 perseant /*
837 1.28 perseant * Call fsync to write the vnode so that we don't have to deal with
838 1.262 hannken * flushing it when it's marked VU_DIROP or reclaiming.
839 1.28 perseant *
840 1.28 perseant * XXX KS - If we can't flush we also can't call vgone(), so must
841 1.28 perseant * return. But, that leaves this vnode in limbo, also not good.
842 1.28 perseant * Can this ever happen (barring hardware failure)?
843 1.28 perseant */
844 1.213 pooka if ((error = VOP_FSYNC(*vpp, NOCRED, FSYNC_WAIT, 0, 0)) != 0) {
845 1.306 maya panic("lfs_mknod: couldn't fsync (ino %llu)",
846 1.306 maya (unsigned long long) ino);
847 1.136 perseant /* return (error); */
848 1.40 perseant }
849 1.134 perseant
850 1.303 dholland vrele(dvp);
851 1.273 hannken KASSERT(error == 0);
852 1.261 hannken VOP_UNLOCK(*vpp);
853 1.86 perseant return (0);
854 1.1 mycroft }
855 1.1 mycroft
856 1.265 dholland /*
857 1.265 dholland * Create a regular file
858 1.265 dholland */
859 1.265 dholland int
860 1.51 perseant lfs_create(void *v)
861 1.10 christos {
862 1.261 hannken struct vop_create_v3_args /* {
863 1.1 mycroft struct vnode *a_dvp;
864 1.1 mycroft struct vnode **a_vpp;
865 1.1 mycroft struct componentname *a_cnp;
866 1.1 mycroft struct vattr *a_vap;
867 1.10 christos } */ *ap = v;
868 1.264 dholland struct lfs *fs;
869 1.264 dholland struct vnode *dvp, **vpp;
870 1.268 dholland struct vattr *vap;
871 1.268 dholland struct ulfs_lookup_results *ulr;
872 1.37 perseant int error;
873 1.1 mycroft
874 1.264 dholland dvp = ap->a_dvp;
875 1.264 dholland vpp = ap->a_vpp;
876 1.268 dholland vap = ap->a_vap;
877 1.264 dholland
878 1.311 riastrad KASSERT(VOP_ISLOCKED(dvp) == LK_EXCLUSIVE);
879 1.264 dholland KASSERT(vpp != NULL);
880 1.264 dholland KASSERT(*vpp == NULL);
881 1.264 dholland
882 1.268 dholland /* XXX should handle this material another way */
883 1.268 dholland ulr = &VTOI(dvp)->i_crap;
884 1.268 dholland ULFS_CHECK_CRAPCOUNTER(VTOI(dvp));
885 1.268 dholland
886 1.264 dholland fs = VFSTOULFS(dvp->v_mount)->um_lfs;
887 1.264 dholland ASSERT_NO_SEGLOCK(fs);
888 1.264 dholland if (fs->lfs_ronly) {
889 1.264 dholland return EROFS;
890 1.264 dholland }
891 1.264 dholland
892 1.264 dholland error = lfs_set_dirop(dvp, NULL);
893 1.272 hannken if (error)
894 1.37 perseant return error;
895 1.264 dholland
896 1.300 dholland error = lfs_makeinode(vap, dvp, ulr, vpp, ap->a_cnp);
897 1.268 dholland if (error) {
898 1.268 dholland goto out;
899 1.268 dholland }
900 1.311 riastrad KASSERT(VOP_ISLOCKED(*vpp) == LK_EXCLUSIVE);
901 1.268 dholland VN_KNOTE(dvp, NOTE_WRITE);
902 1.268 dholland VOP_UNLOCK(*vpp);
903 1.268 dholland
904 1.268 dholland out:
905 1.264 dholland
906 1.264 dholland UNMARK_VNODE(dvp);
907 1.264 dholland UNMARK_VNODE(*vpp);
908 1.281 dholland if (error) {
909 1.264 dholland *vpp = NULL;
910 1.264 dholland }
911 1.264 dholland lfs_unset_dirop(fs, dvp, "create");
912 1.264 dholland
913 1.264 dholland vrele(dvp);
914 1.37 perseant return (error);
915 1.22 perseant }
916 1.22 perseant
917 1.22 perseant int
918 1.267 dholland lfs_mkdir(void *v)
919 1.265 dholland {
920 1.267 dholland struct vop_mkdir_v3_args /* {
921 1.267 dholland struct vnode *a_dvp;
922 1.267 dholland struct vnode **a_vpp;
923 1.267 dholland struct componentname *a_cnp;
924 1.267 dholland struct vattr *a_vap;
925 1.265 dholland } */ *ap = v;
926 1.267 dholland struct lfs *fs;
927 1.267 dholland struct vnode *dvp, *tvp, **vpp;
928 1.267 dholland struct inode *dp, *ip;
929 1.267 dholland struct componentname *cnp;
930 1.267 dholland struct vattr *vap;
931 1.265 dholland struct ulfs_lookup_results *ulr;
932 1.267 dholland struct buf *bp;
933 1.293 dholland LFS_DIRHEADER *dirp;
934 1.267 dholland int dirblksiz;
935 1.267 dholland int error;
936 1.265 dholland
937 1.267 dholland dvp = ap->a_dvp;
938 1.267 dholland tvp = NULL;
939 1.267 dholland vpp = ap->a_vpp;
940 1.267 dholland cnp = ap->a_cnp;
941 1.267 dholland vap = ap->a_vap;
942 1.267 dholland
943 1.311 riastrad KASSERT(VOP_ISLOCKED(dvp) == LK_EXCLUSIVE);
944 1.311 riastrad
945 1.267 dholland dp = VTOI(dvp);
946 1.267 dholland ip = NULL;
947 1.267 dholland
948 1.272 hannken KASSERT(vap->va_type == VDIR);
949 1.267 dholland KASSERT(vpp != NULL);
950 1.267 dholland KASSERT(*vpp == NULL);
951 1.265 dholland
952 1.265 dholland /* XXX should handle this material another way */
953 1.265 dholland ulr = &dp->i_crap;
954 1.265 dholland ULFS_CHECK_CRAPCOUNTER(dp);
955 1.265 dholland
956 1.267 dholland fs = VFSTOULFS(dvp->v_mount)->um_lfs;
957 1.267 dholland ASSERT_NO_SEGLOCK(fs);
958 1.267 dholland if (fs->lfs_ronly) {
959 1.267 dholland return EROFS;
960 1.267 dholland }
961 1.322 zafer
962 1.322 zafer if ((nlink_t)dp->i_nlink >= LINK_MAX) {
963 1.322 zafer return EMLINK;
964 1.322 zafer }
965 1.322 zafer
966 1.267 dholland dirblksiz = fs->um_dirblksiz;
967 1.291 dholland /* XXX dholland 20150911 I believe this to be true, but... */
968 1.291 dholland //KASSERT(dirblksiz == LFS_DIRBLKSIZ);
969 1.267 dholland
970 1.267 dholland error = lfs_set_dirop(dvp, NULL);
971 1.272 hannken if (error)
972 1.267 dholland return error;
973 1.267 dholland
974 1.265 dholland /*
975 1.300 dholland * Must simulate part of lfs_makeinode here to acquire the inode,
976 1.265 dholland * but not have it entered in the parent directory. The entry is
977 1.265 dholland * made later after writing "." and ".." entries.
978 1.265 dholland */
979 1.323 hannken error = vcache_new(dvp->v_mount, dvp, vap, cnp->cn_cred, NULL,
980 1.323 hannken ap->a_vpp);
981 1.272 hannken if (error)
982 1.272 hannken goto out;
983 1.272 hannken
984 1.272 hannken error = vn_lock(*ap->a_vpp, LK_EXCLUSIVE);
985 1.272 hannken if (error) {
986 1.272 hannken vrele(*ap->a_vpp);
987 1.272 hannken *ap->a_vpp = NULL;
988 1.265 dholland goto out;
989 1.272 hannken }
990 1.265 dholland
991 1.272 hannken tvp = *ap->a_vpp;
992 1.319 maya MARK_VNODE(tvp);
993 1.265 dholland ip = VTOI(tvp);
994 1.317 maya ip->i_state |= IN_ACCESS | IN_CHANGE | IN_UPDATE;
995 1.265 dholland ip->i_nlink = 2;
996 1.265 dholland DIP_ASSIGN(ip, nlink, 2);
997 1.265 dholland if (cnp->cn_flags & ISWHITEOUT) {
998 1.265 dholland ip->i_flags |= UF_OPAQUE;
999 1.265 dholland DIP_ASSIGN(ip, flags, ip->i_flags);
1000 1.265 dholland }
1001 1.265 dholland
1002 1.265 dholland /*
1003 1.265 dholland * Bump link count in parent directory to reflect work done below.
1004 1.265 dholland */
1005 1.265 dholland dp->i_nlink++;
1006 1.265 dholland DIP_ASSIGN(dp, nlink, dp->i_nlink);
1007 1.317 maya dp->i_state |= IN_CHANGE;
1008 1.265 dholland if ((error = lfs_update(dvp, NULL, NULL, UPDATE_DIROP)) != 0)
1009 1.265 dholland goto bad;
1010 1.265 dholland
1011 1.265 dholland /*
1012 1.291 dholland * Initialize directory with "." and "..". This used to use a
1013 1.291 dholland * static template but that adds moving parts for very little
1014 1.291 dholland * benefit.
1015 1.265 dholland */
1016 1.265 dholland if ((error = lfs_balloc(tvp, (off_t)0, dirblksiz, cnp->cn_cred,
1017 1.265 dholland B_CLRBUF, &bp)) != 0)
1018 1.265 dholland goto bad;
1019 1.265 dholland ip->i_size = dirblksiz;
1020 1.265 dholland DIP_ASSIGN(ip, size, dirblksiz);
1021 1.317 maya ip->i_state |= IN_ACCESS | IN_CHANGE | IN_UPDATE;
1022 1.265 dholland uvm_vnp_setsize(tvp, ip->i_size);
1023 1.291 dholland dirp = bp->b_data;
1024 1.291 dholland
1025 1.291 dholland /* . */
1026 1.291 dholland lfs_dir_setino(fs, dirp, ip->i_number);
1027 1.292 dholland lfs_dir_setreclen(fs, dirp, LFS_DIRECTSIZ(fs, 1));
1028 1.291 dholland lfs_dir_settype(fs, dirp, LFS_DT_DIR);
1029 1.291 dholland lfs_dir_setnamlen(fs, dirp, 1);
1030 1.291 dholland lfs_copydirname(fs, lfs_dir_nameptr(fs, dirp), ".", 1,
1031 1.292 dholland LFS_DIRECTSIZ(fs, 1));
1032 1.291 dholland dirp = LFS_NEXTDIR(fs, dirp);
1033 1.291 dholland /* .. */
1034 1.291 dholland lfs_dir_setino(fs, dirp, dp->i_number);
1035 1.292 dholland lfs_dir_setreclen(fs, dirp, dirblksiz - LFS_DIRECTSIZ(fs, 1));
1036 1.291 dholland lfs_dir_settype(fs, dirp, LFS_DT_DIR);
1037 1.291 dholland lfs_dir_setnamlen(fs, dirp, 2);
1038 1.291 dholland lfs_copydirname(fs, lfs_dir_nameptr(fs, dirp), "..", 2,
1039 1.292 dholland dirblksiz - LFS_DIRECTSIZ(fs, 1));
1040 1.265 dholland
1041 1.265 dholland /*
1042 1.267 dholland * Directory set up; now install its entry in the parent directory.
1043 1.265 dholland */
1044 1.265 dholland if ((error = VOP_BWRITE(bp->b_vp, bp)) != 0)
1045 1.265 dholland goto bad;
1046 1.265 dholland if ((error = lfs_update(tvp, NULL, NULL, UPDATE_DIROP)) != 0) {
1047 1.265 dholland goto bad;
1048 1.265 dholland }
1049 1.290 dholland error = ulfs_direnter(dvp, ulr, tvp,
1050 1.290 dholland cnp, ip->i_number, LFS_IFTODT(ip->i_mode), bp);
1051 1.265 dholland bad:
1052 1.265 dholland if (error == 0) {
1053 1.265 dholland VN_KNOTE(dvp, NOTE_WRITE | NOTE_LINK);
1054 1.265 dholland VOP_UNLOCK(tvp);
1055 1.265 dholland } else {
1056 1.265 dholland dp->i_nlink--;
1057 1.265 dholland DIP_ASSIGN(dp, nlink, dp->i_nlink);
1058 1.317 maya dp->i_state |= IN_CHANGE;
1059 1.265 dholland /*
1060 1.265 dholland * No need to do an explicit lfs_truncate here, vrele will
1061 1.265 dholland * do this for us because we set the link count to 0.
1062 1.265 dholland */
1063 1.265 dholland ip->i_nlink = 0;
1064 1.265 dholland DIP_ASSIGN(ip, nlink, 0);
1065 1.317 maya ip->i_state |= IN_CHANGE;
1066 1.265 dholland /* If IN_ADIROP, account for it */
1067 1.319 maya UNMARK_VNODE(tvp);
1068 1.265 dholland vput(tvp);
1069 1.265 dholland }
1070 1.267 dholland
1071 1.267 dholland out:
1072 1.264 dholland UNMARK_VNODE(dvp);
1073 1.264 dholland UNMARK_VNODE(*vpp);
1074 1.281 dholland if (error) {
1075 1.264 dholland *vpp = NULL;
1076 1.264 dholland }
1077 1.264 dholland lfs_unset_dirop(fs, dvp, "mkdir");
1078 1.264 dholland
1079 1.264 dholland vrele(dvp);
1080 1.37 perseant return (error);
1081 1.1 mycroft }
1082 1.1 mycroft
1083 1.1 mycroft int
1084 1.51 perseant lfs_remove(void *v)
1085 1.10 christos {
1086 1.314 riastrad struct vop_remove_v2_args /* {
1087 1.1 mycroft struct vnode *a_dvp;
1088 1.1 mycroft struct vnode *a_vp;
1089 1.1 mycroft struct componentname *a_cnp;
1090 1.10 christos } */ *ap = v;
1091 1.34 perseant struct vnode *dvp, *vp;
1092 1.188 perseant struct inode *ip;
1093 1.37 perseant int error;
1094 1.34 perseant
1095 1.34 perseant dvp = ap->a_dvp;
1096 1.34 perseant vp = ap->a_vp;
1097 1.311 riastrad
1098 1.311 riastrad KASSERT(VOP_ISLOCKED(dvp) == LK_EXCLUSIVE);
1099 1.311 riastrad KASSERT(VOP_ISLOCKED(vp) == LK_EXCLUSIVE);
1100 1.311 riastrad
1101 1.188 perseant ip = VTOI(vp);
1102 1.264 dholland if ((error = lfs_set_dirop(dvp, vp)) != 0) {
1103 1.34 perseant if (dvp == vp)
1104 1.34 perseant vrele(vp);
1105 1.34 perseant else
1106 1.34 perseant vput(vp);
1107 1.37 perseant return error;
1108 1.34 perseant }
1109 1.245 dholland error = ulfs_remove(ap);
1110 1.188 perseant if (ip->i_nlink == 0)
1111 1.188 perseant lfs_orphan(ip->i_lfs, ip->i_number);
1112 1.264 dholland
1113 1.264 dholland UNMARK_VNODE(dvp);
1114 1.264 dholland if (ap->a_vp) {
1115 1.264 dholland UNMARK_VNODE(ap->a_vp);
1116 1.264 dholland }
1117 1.264 dholland lfs_unset_dirop(ip->i_lfs, dvp, "remove");
1118 1.264 dholland vrele(dvp);
1119 1.264 dholland if (ap->a_vp) {
1120 1.264 dholland vrele(ap->a_vp);
1121 1.264 dholland }
1122 1.264 dholland
1123 1.37 perseant return (error);
1124 1.1 mycroft }
1125 1.1 mycroft
1126 1.1 mycroft int
1127 1.51 perseant lfs_rmdir(void *v)
1128 1.10 christos {
1129 1.314 riastrad struct vop_rmdir_v2_args /* {
1130 1.1 mycroft struct vnodeop_desc *a_desc;
1131 1.1 mycroft struct vnode *a_dvp;
1132 1.1 mycroft struct vnode *a_vp;
1133 1.1 mycroft struct componentname *a_cnp;
1134 1.10 christos } */ *ap = v;
1135 1.84 perseant struct vnode *vp;
1136 1.188 perseant struct inode *ip;
1137 1.37 perseant int error;
1138 1.1 mycroft
1139 1.84 perseant vp = ap->a_vp;
1140 1.311 riastrad
1141 1.311 riastrad KASSERT(VOP_ISLOCKED(ap->a_dvp) == LK_EXCLUSIVE);
1142 1.311 riastrad KASSERT(VOP_ISLOCKED(vp) == LK_EXCLUSIVE);
1143 1.311 riastrad
1144 1.188 perseant ip = VTOI(vp);
1145 1.264 dholland if ((error = lfs_set_dirop(ap->a_dvp, ap->a_vp)) != 0) {
1146 1.194 chs if (ap->a_dvp == vp)
1147 1.314 riastrad vrele(vp);
1148 1.194 chs else
1149 1.314 riastrad vput(vp);
1150 1.37 perseant return error;
1151 1.34 perseant }
1152 1.245 dholland error = ulfs_rmdir(ap);
1153 1.188 perseant if (ip->i_nlink == 0)
1154 1.188 perseant lfs_orphan(ip->i_lfs, ip->i_number);
1155 1.264 dholland
1156 1.264 dholland UNMARK_VNODE(ap->a_dvp);
1157 1.264 dholland if (ap->a_vp) {
1158 1.264 dholland UNMARK_VNODE(ap->a_vp);
1159 1.264 dholland }
1160 1.264 dholland lfs_unset_dirop(ip->i_lfs, ap->a_dvp, "rmdir");
1161 1.264 dholland vrele(ap->a_dvp);
1162 1.264 dholland if (ap->a_vp) {
1163 1.264 dholland vrele(ap->a_vp);
1164 1.264 dholland }
1165 1.264 dholland
1166 1.37 perseant return (error);
1167 1.1 mycroft }
1168 1.1 mycroft
1169 1.1 mycroft int
1170 1.51 perseant lfs_link(void *v)
1171 1.10 christos {
1172 1.271 riastrad struct vop_link_v2_args /* {
1173 1.9 mycroft struct vnode *a_dvp;
1174 1.1 mycroft struct vnode *a_vp;
1175 1.1 mycroft struct componentname *a_cnp;
1176 1.10 christos } */ *ap = v;
1177 1.264 dholland struct lfs *fs;
1178 1.265 dholland struct vnode *dvp;
1179 1.37 perseant int error;
1180 1.1 mycroft
1181 1.264 dholland dvp = ap->a_dvp;
1182 1.264 dholland
1183 1.311 riastrad KASSERT(VOP_ISLOCKED(dvp) == LK_EXCLUSIVE);
1184 1.311 riastrad
1185 1.264 dholland fs = VFSTOULFS(dvp->v_mount)->um_lfs;
1186 1.264 dholland ASSERT_NO_SEGLOCK(fs);
1187 1.264 dholland if (fs->lfs_ronly) {
1188 1.264 dholland return EROFS;
1189 1.264 dholland }
1190 1.264 dholland
1191 1.264 dholland error = lfs_set_dirop(dvp, NULL);
1192 1.264 dholland if (error) {
1193 1.37 perseant return error;
1194 1.34 perseant }
1195 1.264 dholland
1196 1.245 dholland error = ulfs_link(ap);
1197 1.264 dholland
1198 1.264 dholland UNMARK_VNODE(dvp);
1199 1.264 dholland lfs_unset_dirop(fs, dvp, "link");
1200 1.264 dholland vrele(dvp);
1201 1.264 dholland
1202 1.37 perseant return (error);
1203 1.1 mycroft }
1204 1.22 perseant
1205 1.1 mycroft /* XXX hack to avoid calling ITIMES in getattr */
1206 1.1 mycroft int
1207 1.51 perseant lfs_getattr(void *v)
1208 1.10 christos {
1209 1.1 mycroft struct vop_getattr_args /* {
1210 1.1 mycroft struct vnode *a_vp;
1211 1.1 mycroft struct vattr *a_vap;
1212 1.176 elad kauth_cred_t a_cred;
1213 1.10 christos } */ *ap = v;
1214 1.35 augustss struct vnode *vp = ap->a_vp;
1215 1.311 riastrad struct inode *ip;
1216 1.35 augustss struct vattr *vap = ap->a_vap;
1217 1.311 riastrad struct lfs *fs;
1218 1.311 riastrad
1219 1.311 riastrad KASSERT(VOP_ISLOCKED(vp));
1220 1.311 riastrad
1221 1.311 riastrad ip = VTOI(vp);
1222 1.311 riastrad fs = ip->i_lfs;
1223 1.251 dholland
1224 1.1 mycroft /*
1225 1.1 mycroft * Copy from inode table
1226 1.1 mycroft */
1227 1.1 mycroft vap->va_fsid = ip->i_dev;
1228 1.1 mycroft vap->va_fileid = ip->i_number;
1229 1.246 dholland vap->va_mode = ip->i_mode & ~LFS_IFMT;
1230 1.102 fvdl vap->va_nlink = ip->i_nlink;
1231 1.102 fvdl vap->va_uid = ip->i_uid;
1232 1.102 fvdl vap->va_gid = ip->i_gid;
1233 1.288 dholland switch (vp->v_type) {
1234 1.288 dholland case VBLK:
1235 1.288 dholland case VCHR:
1236 1.288 dholland vap->va_rdev = (dev_t)lfs_dino_getrdev(fs, ip->i_din);
1237 1.288 dholland break;
1238 1.288 dholland default:
1239 1.288 dholland vap->va_rdev = NODEV;
1240 1.288 dholland break;
1241 1.288 dholland }
1242 1.55 chs vap->va_size = vp->v_size;
1243 1.288 dholland vap->va_atime.tv_sec = lfs_dino_getatime(fs, ip->i_din);
1244 1.288 dholland vap->va_atime.tv_nsec = lfs_dino_getatimensec(fs, ip->i_din);
1245 1.288 dholland vap->va_mtime.tv_sec = lfs_dino_getmtime(fs, ip->i_din);
1246 1.288 dholland vap->va_mtime.tv_nsec = lfs_dino_getmtimensec(fs, ip->i_din);
1247 1.288 dholland vap->va_ctime.tv_sec = lfs_dino_getctime(fs, ip->i_din);
1248 1.288 dholland vap->va_ctime.tv_nsec = lfs_dino_getctimensec(fs, ip->i_din);
1249 1.102 fvdl vap->va_flags = ip->i_flags;
1250 1.102 fvdl vap->va_gen = ip->i_gen;
1251 1.1 mycroft /* this doesn't belong here */
1252 1.1 mycroft if (vp->v_type == VBLK)
1253 1.1 mycroft vap->va_blocksize = BLKDEV_IOSIZE;
1254 1.1 mycroft else if (vp->v_type == VCHR)
1255 1.1 mycroft vap->va_blocksize = MAXBSIZE;
1256 1.1 mycroft else
1257 1.1 mycroft vap->va_blocksize = vp->v_mount->mnt_stat.f_iosize;
1258 1.279 dholland vap->va_bytes = lfs_fsbtob(fs, ip->i_lfs_effnblks);
1259 1.1 mycroft vap->va_type = vp->v_type;
1260 1.1 mycroft vap->va_filerev = ip->i_modrev;
1261 1.1 mycroft return (0);
1262 1.61 perseant }
1263 1.61 perseant
1264 1.61 perseant /*
1265 1.61 perseant * Check to make sure the inode blocks won't choke the buffer
1266 1.245 dholland * cache, then call ulfs_setattr as usual.
1267 1.61 perseant */
1268 1.61 perseant int
1269 1.61 perseant lfs_setattr(void *v)
1270 1.61 perseant {
1271 1.149 skrll struct vop_setattr_args /* {
1272 1.61 perseant struct vnode *a_vp;
1273 1.61 perseant struct vattr *a_vap;
1274 1.176 elad kauth_cred_t a_cred;
1275 1.61 perseant } */ *ap = v;
1276 1.61 perseant struct vnode *vp = ap->a_vp;
1277 1.61 perseant
1278 1.311 riastrad KASSERT(VOP_ISLOCKED(vp) == LK_EXCLUSIVE);
1279 1.61 perseant lfs_check(vp, LFS_UNUSED_LBN, 0);
1280 1.245 dholland return ulfs_setattr(v);
1281 1.1 mycroft }
1282 1.22 perseant
1283 1.1 mycroft /*
1284 1.179 perseant * Release the block we hold on lfs_newseg wrapping. Called on file close,
1285 1.188 perseant * or explicitly from LFCNWRAPGO. Called with the interlock held.
1286 1.179 perseant */
1287 1.179 perseant static int
1288 1.193 christos lfs_wrapgo(struct lfs *fs, struct inode *ip, int waitfor)
1289 1.179 perseant {
1290 1.214 ad if (fs->lfs_stoplwp != curlwp)
1291 1.179 perseant return EBUSY;
1292 1.179 perseant
1293 1.214 ad fs->lfs_stoplwp = NULL;
1294 1.214 ad cv_signal(&fs->lfs_stopcv);
1295 1.179 perseant
1296 1.179 perseant KASSERT(fs->lfs_nowrap > 0);
1297 1.179 perseant if (fs->lfs_nowrap <= 0) {
1298 1.179 perseant return 0;
1299 1.179 perseant }
1300 1.179 perseant
1301 1.179 perseant if (--fs->lfs_nowrap == 0) {
1302 1.275 dholland log(LOG_NOTICE, "%s: re-enabled log wrap\n",
1303 1.275 dholland lfs_sb_getfsmnt(fs));
1304 1.188 perseant wakeup(&fs->lfs_wrappass);
1305 1.180 perseant lfs_wakeup_cleaner(fs);
1306 1.179 perseant }
1307 1.179 perseant if (waitfor) {
1308 1.318 maya cv_wait_sig(&fs->lfs_nextsegsleep, &lfs_lock);
1309 1.179 perseant }
1310 1.179 perseant
1311 1.179 perseant return 0;
1312 1.179 perseant }
1313 1.179 perseant
1314 1.179 perseant /*
1315 1.251 dholland * Close called.
1316 1.251 dholland *
1317 1.251 dholland * Update the times on the inode.
1318 1.1 mycroft */
1319 1.1 mycroft /* ARGSUSED */
1320 1.1 mycroft int
1321 1.51 perseant lfs_close(void *v)
1322 1.10 christos {
1323 1.1 mycroft struct vop_close_args /* {
1324 1.1 mycroft struct vnode *a_vp;
1325 1.1 mycroft int a_fflag;
1326 1.176 elad kauth_cred_t a_cred;
1327 1.10 christos } */ *ap = v;
1328 1.35 augustss struct vnode *vp = ap->a_vp;
1329 1.311 riastrad struct inode *ip;
1330 1.311 riastrad struct lfs *fs;
1331 1.311 riastrad
1332 1.311 riastrad KASSERT(VOP_ISLOCKED(vp) == LK_EXCLUSIVE);
1333 1.311 riastrad
1334 1.311 riastrad ip = VTOI(vp);
1335 1.311 riastrad fs = ip->i_lfs;
1336 1.1 mycroft
1337 1.245 dholland if ((ip->i_number == ULFS_ROOTINO || ip->i_number == LFS_IFILE_INUM) &&
1338 1.214 ad fs->lfs_stoplwp == curlwp) {
1339 1.214 ad mutex_enter(&lfs_lock);
1340 1.188 perseant log(LOG_NOTICE, "lfs_close: releasing log wrap control\n");
1341 1.180 perseant lfs_wrapgo(fs, ip, 0);
1342 1.214 ad mutex_exit(&lfs_lock);
1343 1.179 perseant }
1344 1.179 perseant
1345 1.97 perseant if (vp == ip->i_lfs->lfs_ivnode &&
1346 1.119 dbj vp->v_mount->mnt_iflag & IMNT_UNMOUNT)
1347 1.97 perseant return 0;
1348 1.97 perseant
1349 1.97 perseant if (vp->v_usecount > 1 && vp != ip->i_lfs->lfs_ivnode) {
1350 1.154 christos LFS_ITIMES(ip, NULL, NULL, NULL);
1351 1.1 mycroft }
1352 1.1 mycroft return (0);
1353 1.65 perseant }
1354 1.65 perseant
1355 1.65 perseant /*
1356 1.65 perseant * Close wrapper for special devices.
1357 1.65 perseant *
1358 1.65 perseant * Update the times on the inode then do device close.
1359 1.65 perseant */
1360 1.65 perseant int
1361 1.65 perseant lfsspec_close(void *v)
1362 1.65 perseant {
1363 1.65 perseant struct vop_close_args /* {
1364 1.65 perseant struct vnode *a_vp;
1365 1.65 perseant int a_fflag;
1366 1.176 elad kauth_cred_t a_cred;
1367 1.65 perseant } */ *ap = v;
1368 1.65 perseant struct vnode *vp;
1369 1.65 perseant struct inode *ip;
1370 1.65 perseant
1371 1.65 perseant vp = ap->a_vp;
1372 1.311 riastrad
1373 1.311 riastrad KASSERT(VOP_ISLOCKED(vp) == LK_EXCLUSIVE);
1374 1.311 riastrad
1375 1.65 perseant ip = VTOI(vp);
1376 1.65 perseant if (vp->v_usecount > 1) {
1377 1.154 christos LFS_ITIMES(ip, NULL, NULL, NULL);
1378 1.65 perseant }
1379 1.65 perseant return (VOCALL (spec_vnodeop_p, VOFFSET(vop_close), ap));
1380 1.65 perseant }
1381 1.65 perseant
1382 1.65 perseant /*
1383 1.65 perseant * Close wrapper for fifo's.
1384 1.65 perseant *
1385 1.65 perseant * Update the times on the inode then do device close.
1386 1.65 perseant */
1387 1.65 perseant int
1388 1.65 perseant lfsfifo_close(void *v)
1389 1.65 perseant {
1390 1.65 perseant struct vop_close_args /* {
1391 1.65 perseant struct vnode *a_vp;
1392 1.65 perseant int a_fflag;
1393 1.176 elad kauth_cred_ a_cred;
1394 1.65 perseant } */ *ap = v;
1395 1.65 perseant struct vnode *vp;
1396 1.65 perseant struct inode *ip;
1397 1.65 perseant
1398 1.65 perseant vp = ap->a_vp;
1399 1.311 riastrad
1400 1.311 riastrad KASSERT(VOP_ISLOCKED(vp) == LK_EXCLUSIVE);
1401 1.311 riastrad
1402 1.65 perseant ip = VTOI(vp);
1403 1.65 perseant if (ap->a_vp->v_usecount > 1) {
1404 1.154 christos LFS_ITIMES(ip, NULL, NULL, NULL);
1405 1.65 perseant }
1406 1.65 perseant return (VOCALL (fifo_vnodeop_p, VOFFSET(vop_close), ap));
1407 1.1 mycroft }
1408 1.1 mycroft
1409 1.1 mycroft /*
1410 1.15 fvdl * Reclaim an inode so that it can be used for other purposes.
1411 1.1 mycroft */
1412 1.1 mycroft
1413 1.1 mycroft int
1414 1.51 perseant lfs_reclaim(void *v)
1415 1.10 christos {
1416 1.315 riastrad struct vop_reclaim_v2_args /* {
1417 1.1 mycroft struct vnode *a_vp;
1418 1.10 christos } */ *ap = v;
1419 1.15 fvdl struct vnode *vp = ap->a_vp;
1420 1.311 riastrad struct inode *ip;
1421 1.311 riastrad struct lfs *fs;
1422 1.1 mycroft int error;
1423 1.77 yamt
1424 1.315 riastrad VOP_UNLOCK(vp);
1425 1.315 riastrad
1426 1.311 riastrad ip = VTOI(vp);
1427 1.311 riastrad fs = ip->i_lfs;
1428 1.311 riastrad
1429 1.231 hannken /*
1430 1.231 hannken * The inode must be freed and updated before being removed
1431 1.231 hannken * from its hash chain. Other threads trying to gain a hold
1432 1.262 hannken * or lock on the inode will be stalled.
1433 1.231 hannken */
1434 1.231 hannken if (ip->i_nlink <= 0 && (vp->v_mount->mnt_flag & MNT_RDONLY) == 0)
1435 1.231 hannken lfs_vfree(vp, ip->i_number, ip->i_omode);
1436 1.231 hannken
1437 1.214 ad mutex_enter(&lfs_lock);
1438 1.84 perseant LFS_CLR_UINO(ip, IN_ALLMOD);
1439 1.214 ad mutex_exit(&lfs_lock);
1440 1.245 dholland if ((error = ulfs_reclaim(vp)))
1441 1.1 mycroft return (error);
1442 1.203 perseant
1443 1.203 perseant /*
1444 1.203 perseant * Take us off the paging and/or dirop queues if we were on them.
1445 1.203 perseant * We shouldn't be on them.
1446 1.203 perseant */
1447 1.214 ad mutex_enter(&lfs_lock);
1448 1.317 maya if (ip->i_state & IN_PAGING) {
1449 1.203 perseant log(LOG_WARNING, "%s: reclaimed vnode is IN_PAGING\n",
1450 1.275 dholland lfs_sb_getfsmnt(fs));
1451 1.317 maya ip->i_state &= ~IN_PAGING;
1452 1.203 perseant TAILQ_REMOVE(&fs->lfs_pchainhd, ip, i_lfs_pchain);
1453 1.203 perseant }
1454 1.320 maya if (vp->v_uflag & VU_DIROP)
1455 1.212 ad panic("reclaimed vnode is VU_DIROP");
1456 1.214 ad mutex_exit(&lfs_lock);
1457 1.203 perseant
1458 1.287 dholland pool_put(&lfs_dinode_pool, ip->i_din);
1459 1.145 perseant lfs_deregister_all(vp);
1460 1.84 perseant pool_put(&lfs_inoext_pool, ip->inode_ext.lfs);
1461 1.84 perseant ip->inode_ext.lfs = NULL;
1462 1.199 ad genfs_node_destroy(vp);
1463 1.19 thorpej pool_put(&lfs_inode_pool, vp->v_data);
1464 1.1 mycroft vp->v_data = NULL;
1465 1.94 perseant return (0);
1466 1.94 perseant }
1467 1.94 perseant
1468 1.94 perseant /*
1469 1.101 yamt * Read a block from a storage device.
1470 1.251 dholland *
1471 1.251 dholland * Calculate the logical to physical mapping if not done already,
1472 1.251 dholland * then call the device strategy routine.
1473 1.251 dholland *
1474 1.94 perseant * In order to avoid reading blocks that are in the process of being
1475 1.94 perseant * written by the cleaner---and hence are not mutexed by the normal
1476 1.94 perseant * buffer cache / page cache mechanisms---check for collisions before
1477 1.94 perseant * reading.
1478 1.94 perseant *
1479 1.245 dholland * We inline ulfs_strategy to make sure that the VOP_BMAP occurs *before*
1480 1.94 perseant * the active cleaner test.
1481 1.94 perseant *
1482 1.94 perseant * XXX This code assumes that lfs_markv makes synchronous checkpoints.
1483 1.94 perseant */
/*
 * Control flow, as visible in this function:
 *  - Asserts the buffer is a read (B_READ) with a non-zero b_bcount,
 *    and panics for VBLK/VCHR vnodes.
 *  - A VOP_BMAP failure completes the buffer via biodone() with
 *    b_error set and returns that error.
 *  - A negative b_blkno completes the buffer via biodone() and
 *    returns 0 without touching the device.
 *  - While fs->lfs_seglock is set, the target block is compared with
 *    the fs->lfs_cleanint[] entries; on a hit the thread sleeps and the
 *    scan is repeated.
 *  - Finally the buffer goes to VOP_STRATEGY on ip->i_devvp and that
 *    call's return value is returned.
 */
1484 1.94 perseant int
1485 1.94 perseant lfs_strategy(void *v)
1486 1.94 perseant {
1487 1.94 perseant struct vop_strategy_args /* {
1488 1.128 hannken struct vnode *a_vp;
1489 1.94 perseant struct buf *a_bp;
1490 1.94 perseant } */ *ap = v;
1491 1.94 perseant struct buf *bp;
1492 1.94 perseant struct lfs *fs;
1493 1.94 perseant struct vnode *vp;
1494 1.94 perseant struct inode *ip;
1495 1.94 perseant daddr_t tbn;
/* Upper bound on timed "clean2" sleeps before the read is issued anyway. */
1496 1.239 perseant #define MAXLOOP 25
1497 1.239 perseant int i, sn, error, slept, loopcount;
1498 1.94 perseant
1499 1.94 perseant bp = ap->a_bp;
1500 1.128 hannken vp = ap->a_vp;
1501 1.94 perseant ip = VTOI(vp);
1502 1.94 perseant fs = ip->i_lfs;
1503 1.94 perseant
1504 1.101 yamt /* lfs uses its strategy routine only for read */
1505 1.101 yamt KASSERT(bp->b_flags & B_READ);
1506 1.101 yamt
1507 1.94 perseant if (vp->v_type == VBLK || vp->v_type == VCHR)
1508 1.94 perseant panic("lfs_strategy: spec");
1509 1.94 perseant KASSERT(bp->b_bcount != 0);
/* b_blkno still equals b_lblkno: ask VOP_BMAP for the disk address. */
1510 1.94 perseant if (bp->b_blkno == bp->b_lblkno) {
1511 1.94 perseant error = VOP_BMAP(vp, bp->b_lblkno, NULL, &bp->b_blkno,
1512 1.94 perseant NULL);
1513 1.94 perseant if (error) {
1514 1.94 perseant bp->b_error = error;
1515 1.214 ad bp->b_resid = bp->b_bcount;
1516 1.94 perseant biodone(bp);
1517 1.94 perseant return (error);
1518 1.94 perseant }
1519 1.94 perseant if ((long)bp->b_blkno == -1) /* no valid data */
1520 1.94 perseant clrbuf(bp);
1521 1.94 perseant }
1522 1.94 perseant if ((long)bp->b_blkno < 0) { /* block is not on disk */
1523 1.214 ad bp->b_resid = bp->b_bcount;
1524 1.94 perseant biodone(bp);
1525 1.94 perseant return (0);
1526 1.94 perseant }
1527 1.94 perseant
/*
 * slept starts at 1 so the interval scan runs at least once whenever
 * lfs_seglock is set; it is cleared at the top of each pass and set
 * again only if that pass actually slept.
 */
1528 1.94 perseant slept = 1;
1529 1.239 perseant loopcount = 0;
1530 1.214 ad mutex_enter(&lfs_lock);
1531 1.101 yamt while (slept && fs->lfs_seglock) {
1532 1.214 ad mutex_exit(&lfs_lock);
1533 1.94 perseant /*
1534 1.94 perseant * Look through list of intervals.
1535 1.94 perseant * There will only be intervals to look through
1536 1.94 perseant * if the cleaner holds the seglock.
1537 1.94 perseant * Since the cleaner is synchronous, we can trust
1538 1.94 perseant * the list of intervals to be current.
1539 1.94 perseant */
1540 1.248 christos tbn = LFS_DBTOFSB(fs, bp->b_blkno);
1541 1.248 christos sn = lfs_dtosn(fs, tbn);
1542 1.94 perseant slept = 0;
1543 1.94 perseant for (i = 0; i < fs->lfs_cleanind; i++) {
1544 1.248 christos if (sn == lfs_dtosn(fs, fs->lfs_cleanint[i]) &&
1545 1.94 perseant tbn >= fs->lfs_cleanint[i]) {
1546 1.136 perseant DLOG((DLOG_CLEAN,
1547 1.306 maya "lfs_strategy: ino %llu lbn %" PRId64
1548 1.280 dholland " ind %d sn %d fsb %" PRIx64
1549 1.203 perseant " given sn %d fsb %" PRIx64 "\n",
1550 1.306 maya (unsigned long long) ip->i_number,
1551 1.306 maya bp->b_lblkno, i,
1552 1.248 christos lfs_dtosn(fs, fs->lfs_cleanint[i]),
1553 1.203 perseant fs->lfs_cleanint[i], sn, tbn));
1554 1.136 perseant DLOG((DLOG_CLEAN,
1555 1.306 maya "lfs_strategy: sleeping on ino %llu lbn %"
1556 1.306 maya PRId64 "\n",
1557 1.306 maya (unsigned long long) ip->i_number,
1558 1.306 maya bp->b_lblkno));
1559 1.214 ad mutex_enter(&lfs_lock);
1560 1.170 perseant if (LFS_SEGLOCK_HELD(fs) && fs->lfs_iocount) {
1561 1.239 perseant /*
1562 1.239 perseant * Cleaner can't wait for itself.
1563 1.239 perseant * Instead, wait for the blocks
1564 1.239 perseant * to be written to disk.
1565 1.239 perseant * XXX we need pribio in the test
1566 1.239 perseant * XXX here.
1567 1.239 perseant */
1568 1.239 perseant mtsleep(&fs->lfs_iocount,
1569 1.239 perseant (PRIBIO + 1) | PNORELOCK,
1570 1.239 perseant "clean2", hz/10 + 1,
1571 1.239 perseant &lfs_lock);
1572 1.170 perseant slept = 1;
1573 1.239 perseant ++loopcount;
1574 1.170 perseant break;
1575 1.170 perseant } else if (fs->lfs_seglock) {
1576 1.214 ad mtsleep(&fs->lfs_seglock,
1577 1.141 perseant (PRIBIO + 1) | PNORELOCK,
1578 1.170 perseant "clean1", 0,
1579 1.214 ad &lfs_lock);
1580 1.167 perseant slept = 1;
1581 1.167 perseant break;
1582 1.167 perseant }
1583 1.214 ad mutex_exit(&lfs_lock);
1584 1.94 perseant }
1585 1.94 perseant }
/*
 * lfs_lock is not held here: the no-sleep path dropped it at the end of
 * the for body, and both sleeps pass PNORELOCK (presumably: do not
 * re-acquire the mutex on wakeup -- confirm against mtsleep(9)).
 * Re-take it before the while condition is evaluated again.
 */
1586 1.214 ad mutex_enter(&lfs_lock);
/* Only the timed "clean2" sleep advances loopcount. */
1587 1.239 perseant if (loopcount > MAXLOOP) {
1588 1.239 perseant printf("lfs_strategy: breaking out of clean2 loop\n");
1589 1.239 perseant break;
1590 1.239 perseant }
1591 1.94 perseant }
1592 1.214 ad mutex_exit(&lfs_lock);
1593 1.94 perseant
/* Issue the read against the inode's device vnode. */
1594 1.94 perseant vp = ip->i_devvp;
1595 1.251 dholland return VOP_STRATEGY(vp, bp);
1596 1.89 perseant }
1597 1.89 perseant
/*
 * Event counter (group "lfs", name "dchain marker pass flush").
 * lfs_flush_dirops() increments it each time its walk of the dirop
 * chain steps over an entry flagged IN_MARKER.
 */
1598 1.326 riastrad static struct evcnt lfs_dchain_marker_pass_flush =
1599 1.326 riastrad EVCNT_INITIALIZER(EVCNT_TYPE_MISC, NULL, "lfs", "dchain marker pass flush");
1600 1.326 riastrad EVCNT_ATTACH_STATIC(lfs_dchain_marker_pass_flush);
1601 1.326 riastrad
1602 1.239 perseant /*
1603 1.239 perseant * Inline lfs_segwrite/lfs_writevnodes, but just for dirops.
1604 1.239 perseant * Technically this is a checkpoint (the on-disk state is valid)
1605 1.239 perseant * even though we are leaving out all the file data.
1606 1.239 perseant */
/*
 * Return values, as visible in this function:
 *   EROFS   fs->lfs_ronly is set.
 *   0       the dirop chain was empty, or the walk finished and the
 *           last lfs_writeinode() call returned 0.
 *   EAGAIN  lfs_writefile() or lfs_writeinode() failed while the
 *           segment has SEGM_SINGLE set; the walk stops early.
 *   other   the error of the last lfs_writeinode() call ("error" is
 *           overwritten on every iteration).
 *
 * Asserts that fs->lfs_nadirop and fs->lfs_dirops are both zero on
 * entry and, once lfs_lock is taken for the walk, that fs->lfs_writer
 * is set.
 */
1607 1.239 perseant int
1608 1.92 perseant lfs_flush_dirops(struct lfs *fs)
1609 1.92 perseant {
1610 1.326 riastrad struct inode *ip, *marker;
1611 1.92 perseant struct vnode *vp;
1612 1.285 dholland extern int lfs_dostats; /* XXX this does not belong here */
1613 1.92 perseant struct segment *sp;
1614 1.285 dholland SEGSUM *ssp;
1615 1.239 perseant int flags = 0;
1616 1.239 perseant int error = 0;
1617 1.92 perseant
1618 1.163 perseant ASSERT_MAYBE_SEGLOCK(fs);
1619 1.327 riastrad KASSERT(fs->lfs_nadirop == 0); /* stable during lfs_writer */
1620 1.327 riastrad KASSERT(fs->lfs_dirops == 0); /* stable during lfs_writer */
1621 1.141 perseant
1622 1.92 perseant if (fs->lfs_ronly)
1623 1.239 perseant return EROFS;
1624 1.92 perseant
/* Nothing queued: return before allocating the marker or taking the seglock. */
1625 1.214 ad mutex_enter(&lfs_lock);
1626 1.141 perseant if (TAILQ_FIRST(&fs->lfs_dchainhd) == NULL) {
1627 1.214 ad mutex_exit(&lfs_lock);
1628 1.239 perseant return 0;
1629 1.141 perseant } else
1630 1.214 ad mutex_exit(&lfs_lock);
1631 1.92 perseant
1632 1.92 perseant if (lfs_dostats)
1633 1.92 perseant ++lfs_stats.flush_invoked;
1634 1.92 perseant
/*
 * Build a zeroed placeholder inode (with a zeroed LFS extension) flagged
 * IN_MARKER.  It is linked into the dirop chain below and used as the
 * cursor for the walk.
 */
1635 1.326 riastrad marker = pool_get(&lfs_inode_pool, PR_WAITOK);
1636 1.326 riastrad memset(marker, 0, sizeof(*marker));
1637 1.326 riastrad marker->inode_ext.lfs = pool_get(&lfs_inoext_pool, PR_WAITOK);
1638 1.326 riastrad memset(marker->inode_ext.lfs, 0, sizeof(*marker->inode_ext.lfs));
1639 1.326 riastrad marker->i_state = IN_MARKER;
1640 1.326 riastrad
1641 1.92 perseant lfs_imtime(fs);
1642 1.239 perseant lfs_seglock(fs, flags);
1643 1.92 perseant sp = fs->lfs_sp;
1644 1.92 perseant
1645 1.92 perseant /*
1646 1.92 perseant * lfs_writevnodes, optimized to get dirops out of the way.
1647 1.92 perseant * Only write dirops, and don't flush files' pages, only
1648 1.92 perseant * blocks from the directories.
1649 1.92 perseant *
1650 1.92 perseant * We don't need to vref these files because they are
1651 1.92 perseant * dirops and so hold an extra reference until the
1652 1.92 perseant * segunlock clears them of that status.
1653 1.92 perseant *
1654 1.92 perseant * We don't need to check for IN_ADIROP because we know that
1655 1.92 perseant * no dirops are active.
1656 1.92 perseant *
1657 1.92 perseant */
1658 1.214 ad mutex_enter(&lfs_lock);
1659 1.327 riastrad KASSERT(fs->lfs_writer);
1660 1.326 riastrad TAILQ_INSERT_HEAD(&fs->lfs_dchainhd, marker, i_lfs_dchain);
/*
 * Each pass takes the entry following the marker, re-links the marker
 * just after that entry, and then processes the entry.  lfs_lock is
 * held at the top of every pass.
 */
1661 1.326 riastrad while ((ip = TAILQ_NEXT(marker, i_lfs_dchain)) != NULL) {
1662 1.326 riastrad TAILQ_REMOVE(&fs->lfs_dchainhd, marker, i_lfs_dchain);
1663 1.326 riastrad TAILQ_INSERT_AFTER(&fs->lfs_dchainhd, ip, marker,
1664 1.326 riastrad i_lfs_dchain);
/* Another marker on the chain: count it and move on. */
1665 1.326 riastrad if (ip->i_state & IN_MARKER) {
1666 1.326 riastrad lfs_dchain_marker_pass_flush.ev_count++;
1667 1.326 riastrad continue;
1668 1.326 riastrad }
1669 1.92 perseant vp = ITOV(ip);
1670 1.92 perseant
1671 1.329 riastrad /*
1672 1.329 riastrad * Prevent the vnode from going away if it's just been
1673 1.329 riastrad * put out in the segment and lfs_unmark_dirop is about
1674 1.329 riastrad * to release it. While it is on the list it is always
1675 1.329 riastrad * referenced, so it cannot be reclaimed until we
1676 1.329 riastrad * release it.
1677 1.329 riastrad */
1678 1.329 riastrad vref(vp);
1679 1.329 riastrad
1680 1.329 riastrad /*
1681 1.329 riastrad * Since we hold lfs_writer, the node can't be in an
1682 1.329 riastrad * active dirop. Since it's on the list and we hold a
1683 1.329 riastrad * reference to it, it can't be reclaimed now.
1684 1.329 riastrad */
1685 1.317 maya KASSERT((ip->i_state & IN_ADIROP) == 0);
1686 1.239 perseant KASSERT(vp->v_uflag & VU_DIROP);
1687 1.329 riastrad
1688 1.329 riastrad /*
1689 1.329 riastrad * After we release lfs_lock, if we were in the middle
1690 1.329 riastrad * of writing a segment, lfs_unmark_dirop may end up
1691 1.329 riastrad * clearing VU_DIROP, and we have no way to stop it.
1692 1.329 riastrad * That should be OK -- we'll just have less to do
1693 1.329 riastrad * here.
1694 1.329 riastrad */
1695 1.329 riastrad mutex_exit(&lfs_lock);
1696 1.171 perseant
1697 1.92 perseant /*
1698 1.92 perseant * All writes to directories come from dirops; all
1699 1.92 perseant * writes to files' direct blocks go through the page
1700 1.92 perseant * cache, which we're not touching. Reads to files
1701 1.92 perseant * and/or directories will not be affected by writing
1702 1.92 perseant * directory blocks inodes and file inodes. So we don't
1703 1.239 perseant * really need to lock.
1704 1.92 perseant */
1705 1.92 perseant if (vp->v_type != VREG &&
1706 1.317 maya ((ip->i_state & IN_ALLMOD) || !VPISEMPTY(vp))) {
1707 1.239 perseant error = lfs_writefile(fs, sp, vp);
1708 1.92 perseant if (!VPISEMPTY(vp) && !WRITEINPROG(vp) &&
1709 1.317 maya !(ip->i_state & IN_ALLMOD)) {
1710 1.214 ad mutex_enter(&lfs_lock);
1711 1.92 perseant LFS_SET_UINO(ip, IN_MODIFIED);
1712 1.214 ad mutex_exit(&lfs_lock);
1713 1.92 perseant }
/* Drop our reference and re-take lfs_lock before leaving the loop. */
1714 1.239 perseant if (error && (sp->seg_flags & SEGM_SINGLE)) {
1715 1.329 riastrad vrele(vp);
1716 1.239 perseant mutex_enter(&lfs_lock);
1717 1.239 perseant error = EAGAIN;
1718 1.239 perseant break;
1719 1.239 perseant }
1720 1.92 perseant }
1721 1.328 riastrad KASSERT(ip->i_number != LFS_IFILE_INUM);
1722 1.239 perseant error = lfs_writeinode(fs, sp, ip);
1723 1.239 perseant if (error && (sp->seg_flags & SEGM_SINGLE)) {
1724 1.329 riastrad vrele(vp);
1725 1.329 riastrad mutex_enter(&lfs_lock);
1726 1.239 perseant error = EAGAIN;
1727 1.239 perseant break;
1728 1.239 perseant }
1729 1.239 perseant
1730 1.228 hannken /*
1731 1.239 perseant * We might need to update these inodes again,
1732 1.239 perseant * for example, if they have data blocks to write.
1733 1.239 perseant * Make sure that after this flush, they are still
1734 1.239 perseant * marked IN_MODIFIED so that we don't forget to
1735 1.239 perseant * write them.
1736 1.228 hannken */
1737 1.239 perseant /* XXX only for non-directories? --KS */
1738 1.329 riastrad mutex_enter(&lfs_lock);
1739 1.239 perseant LFS_SET_UINO(ip, IN_MODIFIED);
1740 1.329 riastrad mutex_exit(&lfs_lock);
1741 1.329 riastrad
/* vrele() is called with lfs_lock dropped; the lock is re-taken for the next pass. */
1742 1.329 riastrad vrele(vp);
1743 1.329 riastrad mutex_enter(&lfs_lock);
1744 1.92 perseant }
/* lfs_lock is held here on every exit path from the loop. */
1745 1.326 riastrad TAILQ_REMOVE(&fs->lfs_dchainhd, marker, i_lfs_dchain);
1746 1.214 ad mutex_exit(&lfs_lock);
1747 1.326 riastrad
1748 1.92 perseant /* We've written all the dirops there are */
1749 1.285 dholland ssp = (SEGSUM *)sp->segsum;
1750 1.285 dholland lfs_ss_setflags(fs, ssp, lfs_ss_getflags(fs, ssp) & ~(SS_CONT));
1751 1.170 perseant lfs_finalize_fs_seguse(fs);
1752 1.92 perseant (void) lfs_writeseg(fs, sp);
1753 1.92 perseant lfs_segunlock(fs);
1754 1.239 perseant
/* Give the marker and its extension back to their pools. */
1755 1.326 riastrad pool_put(&lfs_inoext_pool, marker->inode_ext.lfs);
1756 1.326 riastrad pool_put(&lfs_inode_pool, marker);
1757 1.326 riastrad
1758 1.239 perseant return error;
1759 1.92 perseant }
1760 1.92 perseant
1761 1.89 perseant /*
1762 1.164 perseant * Flush all vnodes for which the pagedaemon has requested pageouts.
1763 1.212 ad * Skip over any files that are marked VU_DIROP (since lfs_flush_dirop()
1764 1.164 perseant * has just run, this would be an error). If we have to skip a vnode
1765 1.164 perseant * for any reason, just skip it; if we have to wait for the cleaner,
1766 1.164 perseant * abort. The writer daemon will call us again later.
1767 1.164 perseant */
/*
 * Return values, as visible in this function:
 *   EROFS  fs->lfs_ronly is set.
 *   0      the paging chain was empty, or the scan ran (whether or not
 *          individual writes failed).
 *   other  a non-zero result from lfs_flush_dirops().
 *
 * Asserts that the seglock is not held and that fs->lfs_writer is set.
 *
 * NOTE(review): the "};" after the vcache_get() failure branch leaves a
 * harmless empty statement behind.
 * NOTE(review): on EAGAIN, lfs_writeseg() is called inside the loop and
 * again right after it -- confirm that the second call is intended.
 * NOTE(review): an entry on the chain without IN_PAGING makes the first
 * "goto top" rescan from the head with lfs_lock held; it looks like
 * this relies on such entries never being on the chain -- confirm.
 */
1768 1.239 perseant int
1769 1.164 perseant lfs_flush_pchain(struct lfs *fs)
1770 1.164 perseant {
1771 1.164 perseant struct inode *ip, *nip;
1772 1.164 perseant struct vnode *vp;
1773 1.164 perseant extern int lfs_dostats;
1774 1.164 perseant struct segment *sp;
1775 1.239 perseant int error, error2;
1776 1.164 perseant
1777 1.164 perseant ASSERT_NO_SEGLOCK(fs);
1778 1.327 riastrad KASSERT(fs->lfs_writer);
1779 1.164 perseant
1780 1.164 perseant if (fs->lfs_ronly)
1781 1.239 perseant return EROFS;
1782 1.164 perseant
1783 1.214 ad mutex_enter(&lfs_lock);
1784 1.164 perseant if (TAILQ_FIRST(&fs->lfs_pchainhd) == NULL) {
1785 1.214 ad mutex_exit(&lfs_lock);
1786 1.239 perseant return 0;
1787 1.164 perseant } else
1788 1.214 ad mutex_exit(&lfs_lock);
1789 1.164 perseant
1790 1.164 perseant /* Get dirops out of the way */
1791 1.239 perseant if ((error = lfs_flush_dirops(fs)) != 0)
1792 1.239 perseant return error;
1793 1.164 perseant
1794 1.164 perseant if (lfs_dostats)
1795 1.164 perseant ++lfs_stats.flush_invoked;
1796 1.164 perseant
1797 1.164 perseant /*
1798 1.164 perseant * Inline lfs_segwrite/lfs_writevnodes, but just for pageouts.
1799 1.164 perseant */
1800 1.164 perseant lfs_imtime(fs);
1801 1.164 perseant lfs_seglock(fs, 0);
1802 1.164 perseant sp = fs->lfs_sp;
1803 1.164 perseant
1804 1.164 perseant /*
1805 1.164 perseant * lfs_writevnodes, optimized to clear pageout requests.
1806 1.164 perseant * Only write non-dirop files that are in the pageout queue.
1807 1.164 perseant * We're very conservative about what we write; we want to be
1808 1.164 perseant * fast and async.
1809 1.164 perseant */
1810 1.214 ad mutex_enter(&lfs_lock);
/* Every "goto top" arrives with lfs_lock held and restarts at the list head. */
1811 1.214 ad top:
1812 1.164 perseant for (ip = TAILQ_FIRST(&fs->lfs_pchainhd); ip != NULL; ip = nip) {
1813 1.277 hannken struct mount *mp = ITOV(ip)->v_mount;
1814 1.277 hannken ino_t ino = ip->i_number;
1815 1.277 hannken
/* Remember the successor before lfs_lock is dropped below. */
1816 1.164 perseant nip = TAILQ_NEXT(ip, i_lfs_pchain);
1817 1.164 perseant
1818 1.317 maya if (!(ip->i_state & IN_PAGING))
1819 1.164 perseant goto top;
1820 1.164 perseant
/*
 * With lfs_lock dropped, look the vnode up by inode number and try a
 * non-blocking exclusive lock.  If either step fails, the entry is
 * skipped ("continue" advances to nip).
 */
1821 1.277 hannken mutex_exit(&lfs_lock);
1822 1.277 hannken if (vcache_get(mp, &ino, sizeof(ino), &vp) != 0) {
1823 1.277 hannken mutex_enter(&lfs_lock);
1824 1.164 perseant continue;
1825 1.277 hannken };
1826 1.277 hannken if (vn_lock(vp, LK_EXCLUSIVE | LK_NOWAIT) != 0) {
1827 1.277 hannken vrele(vp);
1828 1.277 hannken mutex_enter(&lfs_lock);
1829 1.164 perseant continue;
1830 1.214 ad }
/* Re-derive ip from the vnode just obtained and re-check its state under lfs_lock. */
1831 1.277 hannken ip = VTOI(vp);
1832 1.277 hannken mutex_enter(&lfs_lock);
1833 1.277 hannken if ((vp->v_uflag & VU_DIROP) != 0 || vp->v_type != VREG ||
1834 1.317 maya !(ip->i_state & IN_PAGING)) {
1835 1.277 hannken mutex_exit(&lfs_lock);
1836 1.277 hannken vput(vp);
1837 1.214 ad mutex_enter(&lfs_lock);
1838 1.277 hannken goto top;
1839 1.165 perseant }
1840 1.277 hannken mutex_exit(&lfs_lock);
1841 1.164 perseant
1842 1.164 perseant error = lfs_writefile(fs, sp, vp);
1843 1.164 perseant if (!VPISEMPTY(vp) && !WRITEINPROG(vp) &&
1844 1.317 maya !(ip->i_state & IN_ALLMOD)) {
1845 1.214 ad mutex_enter(&lfs_lock);
1846 1.164 perseant LFS_SET_UINO(ip, IN_MODIFIED);
1847 1.214 ad mutex_exit(&lfs_lock);
1848 1.164 perseant }
1849 1.328 riastrad KASSERT(ip->i_number != LFS_IFILE_INUM);
1850 1.239 perseant error2 = lfs_writeinode(fs, sp, ip);
1851 1.164 perseant
1852 1.229 hannken VOP_UNLOCK(vp);
1853 1.272 hannken vrele(vp);
1854 1.164 perseant
/* EAGAIN from either write ends the scan; other errors are ignored. */
1855 1.239 perseant if (error == EAGAIN || error2 == EAGAIN) {
1856 1.164 perseant lfs_writeseg(fs, sp);
1857 1.214 ad mutex_enter(&lfs_lock);
1858 1.164 perseant break;
1859 1.164 perseant }
1860 1.214 ad mutex_enter(&lfs_lock);
1861 1.164 perseant }
1862 1.214 ad mutex_exit(&lfs_lock);
1863 1.164 perseant (void) lfs_writeseg(fs, sp);
1864 1.164 perseant lfs_segunlock(fs);
1865 1.239 perseant
/* error/error2 from the loop are not propagated to the caller. */
1866 1.239 perseant return 0;
1867 1.164 perseant }
1868 1.164 perseant
1869 1.164 perseant /*
1870 1.283 dholland * Conversion for compat.
1871 1.283 dholland */
1872 1.283 dholland static void
1873 1.283 dholland block_info_from_70(BLOCK_INFO *bi, const BLOCK_INFO_70 *bi70)
1874 1.283 dholland {
1875 1.283 dholland bi->bi_inode = bi70->bi_inode;
1876 1.283 dholland bi->bi_lbn = bi70->bi_lbn;
1877 1.283 dholland bi->bi_daddr = bi70->bi_daddr;
1878 1.283 dholland bi->bi_segcreate = bi70->bi_segcreate;
1879 1.283 dholland bi->bi_version = bi70->bi_version;
1880 1.283 dholland bi->bi_bp = bi70->bi_bp;
1881 1.283 dholland bi->bi_size = bi70->bi_size;
1882 1.283 dholland }
1883 1.283 dholland
1884 1.283 dholland static void
1885 1.283 dholland block_info_to_70(BLOCK_INFO_70 *bi70, const BLOCK_INFO *bi)
1886 1.283 dholland {
1887 1.283 dholland bi70->bi_inode = bi->bi_inode;
1888 1.283 dholland bi70->bi_lbn = bi->bi_lbn;
1889 1.283 dholland bi70->bi_daddr = bi->bi_daddr;
1890 1.283 dholland bi70->bi_segcreate = bi->bi_segcreate;
1891 1.283 dholland bi70->bi_version = bi->bi_version;
1892 1.283 dholland bi70->bi_bp = bi->bi_bp;
1893 1.283 dholland bi70->bi_size = bi->bi_size;
1894 1.283 dholland }
1895 1.283 dholland
1896 1.283 dholland /*
1897 1.90 perseant * Provide a fcntl interface to sys_lfs_{segwait,bmapv,markv}.
1898 1.89 perseant */
1899 1.89 perseant int
1900 1.90 perseant lfs_fcntl(void *v)
1901 1.89 perseant {
1902 1.137 simonb struct vop_fcntl_args /* {
1903 1.137 simonb struct vnode *a_vp;
1904 1.218 gmcgarry u_int a_command;
1905 1.201 christos void * a_data;
1906 1.137 simonb int a_fflag;
1907 1.176 elad kauth_cred_t a_cred;
1908 1.137 simonb } */ *ap = v;
1909 1.222 christos struct timeval tv;
1910 1.89 perseant struct timeval *tvp;
1911 1.89 perseant BLOCK_INFO *blkiov;
1912 1.283 dholland BLOCK_INFO_70 *blkiov70;
1913 1.92 perseant CLEANERINFO *cip;
1914 1.148 perseant SEGUSE *sup;
1915 1.283 dholland int blkcnt, i, error;
1916 1.181 martin size_t fh_size;
1917 1.90 perseant struct lfs_fcntl_markv blkvp;
1918 1.283 dholland struct lfs_fcntl_markv_70 blkvp70;
1919 1.185 ad struct lwp *l;
1920 1.89 perseant fsid_t *fsidp;
1921 1.92 perseant struct lfs *fs;
1922 1.92 perseant struct buf *bp;
1923 1.134 perseant fhandle_t *fhp;
1924 1.92 perseant daddr_t off;
1925 1.258 christos int oclean;
1926 1.89 perseant
1927 1.90 perseant /* Only respect LFS fcntls on fs root or Ifile */
1928 1.245 dholland if (VTOI(ap->a_vp)->i_number != ULFS_ROOTINO &&
1929 1.89 perseant VTOI(ap->a_vp)->i_number != LFS_IFILE_INUM) {
1930 1.245 dholland return ulfs_fcntl(v);
1931 1.89 perseant }
1932 1.89 perseant
1933 1.100 perseant /* Avoid locking a draining lock */
1934 1.119 dbj if (ap->a_vp->v_mount->mnt_iflag & IMNT_UNMOUNT) {
1935 1.100 perseant return ESHUTDOWN;
1936 1.100 perseant }
1937 1.100 perseant
1938 1.184 perseant /* LFS control and monitoring fcntls are available only to root */
1939 1.213 pooka l = curlwp;
1940 1.184 perseant if (((ap->a_command & 0xff00) >> 8) == 'L' &&
1941 1.241 elad (error = kauth_authorize_system(l->l_cred, KAUTH_SYSTEM_LFS,
1942 1.241 elad KAUTH_REQ_SYSTEM_LFS_FCNTL, NULL, NULL, NULL)) != 0)
1943 1.184 perseant return (error);
1944 1.184 perseant
1945 1.100 perseant fs = VTOI(ap->a_vp)->i_lfs;
1946 1.131 christos fsidp = &ap->a_vp->v_mount->mnt_stat.f_fsidx;
1947 1.89 perseant
1948 1.188 perseant error = 0;
1949 1.218 gmcgarry switch ((int)ap->a_command) {
1950 1.222 christos case LFCNSEGWAITALL_COMPAT_50:
1951 1.222 christos case LFCNSEGWAITALL_COMPAT:
1952 1.222 christos fsidp = NULL;
1953 1.283 dholland /* FALLTHROUGH */
1954 1.222 christos case LFCNSEGWAIT_COMPAT_50:
1955 1.222 christos case LFCNSEGWAIT_COMPAT:
1956 1.222 christos {
1957 1.222 christos struct timeval50 *tvp50
1958 1.222 christos = (struct timeval50 *)ap->a_data;
1959 1.222 christos timeval50_to_timeval(tvp50, &tv);
1960 1.222 christos tvp = &tv;
1961 1.222 christos }
1962 1.222 christos goto segwait_common;
1963 1.90 perseant case LFCNSEGWAITALL:
1964 1.214 ad fsidp = NULL;
1965 1.283 dholland /* FALLTHROUGH */
1966 1.90 perseant case LFCNSEGWAIT:
1967 1.214 ad tvp = (struct timeval *)ap->a_data;
1968 1.222 christos segwait_common:
1969 1.214 ad mutex_enter(&lfs_lock);
1970 1.214 ad ++fs->lfs_sleepers;
1971 1.214 ad mutex_exit(&lfs_lock);
1972 1.214 ad
1973 1.214 ad error = lfs_segwait(fsidp, tvp);
1974 1.214 ad
1975 1.214 ad mutex_enter(&lfs_lock);
1976 1.214 ad if (--fs->lfs_sleepers == 0)
1977 1.308 maya cv_broadcast(&fs->lfs_sleeperscv);
1978 1.214 ad mutex_exit(&lfs_lock);
1979 1.214 ad return error;
1980 1.89 perseant
1981 1.283 dholland case LFCNBMAPV_COMPAT_70:
1982 1.283 dholland case LFCNMARKV_COMPAT_70:
1983 1.283 dholland blkvp70 = *(struct lfs_fcntl_markv_70 *)ap->a_data;
1984 1.283 dholland
1985 1.283 dholland blkcnt = blkvp70.blkcnt;
1986 1.283 dholland if ((u_int) blkcnt > LFS_MARKV_MAXBLKCNT)
1987 1.283 dholland return (EINVAL);
1988 1.283 dholland blkiov = lfs_malloc(fs, blkcnt * sizeof(BLOCK_INFO), LFS_NB_BLKIOV);
1989 1.283 dholland blkiov70 = lfs_malloc(fs, sizeof(BLOCK_INFO_70), LFS_NB_BLKIOV);
1990 1.283 dholland for (i = 0; i < blkcnt; i++) {
1991 1.283 dholland error = copyin(&blkvp70.blkiov[i], blkiov70,
1992 1.283 dholland sizeof(*blkiov70));
1993 1.283 dholland if (error) {
1994 1.283 dholland lfs_free(fs, blkiov70, LFS_NB_BLKIOV);
1995 1.283 dholland lfs_free(fs, blkiov, LFS_NB_BLKIOV);
1996 1.283 dholland return error;
1997 1.283 dholland }
1998 1.283 dholland block_info_from_70(&blkiov[i], blkiov70);
1999 1.283 dholland }
2000 1.283 dholland
2001 1.283 dholland mutex_enter(&lfs_lock);
2002 1.283 dholland ++fs->lfs_sleepers;
2003 1.283 dholland mutex_exit(&lfs_lock);
2004 1.283 dholland if (ap->a_command == LFCNBMAPV)
2005 1.283 dholland error = lfs_bmapv(l, fsidp, blkiov, blkcnt);
2006 1.283 dholland else /* LFCNMARKV */
2007 1.283 dholland error = lfs_markv(l, fsidp, blkiov, blkcnt);
2008 1.283 dholland if (error == 0) {
2009 1.283 dholland for (i = 0; i < blkcnt; i++) {
2010 1.283 dholland block_info_to_70(blkiov70, &blkiov[i]);
2011 1.283 dholland error = copyout(blkiov70, &blkvp70.blkiov[i],
2012 1.283 dholland sizeof(*blkiov70));
2013 1.283 dholland if (error) {
2014 1.283 dholland break;
2015 1.283 dholland }
2016 1.283 dholland }
2017 1.283 dholland }
2018 1.283 dholland mutex_enter(&lfs_lock);
2019 1.283 dholland if (--fs->lfs_sleepers == 0)
2020 1.308 maya cv_broadcast(&fs->lfs_sleeperscv);
2021 1.283 dholland mutex_exit(&lfs_lock);
2022 1.283 dholland lfs_free(fs, blkiov, LFS_NB_BLKIOV);
2023 1.283 dholland return error;
2024 1.283 dholland
2025 1.90 perseant case LFCNBMAPV:
2026 1.90 perseant case LFCNMARKV:
2027 1.214 ad blkvp = *(struct lfs_fcntl_markv *)ap->a_data;
2028 1.89 perseant
2029 1.214 ad blkcnt = blkvp.blkcnt;
2030 1.214 ad if ((u_int) blkcnt > LFS_MARKV_MAXBLKCNT)
2031 1.214 ad return (EINVAL);
2032 1.214 ad blkiov = lfs_malloc(fs, blkcnt * sizeof(BLOCK_INFO), LFS_NB_BLKIOV);
2033 1.214 ad if ((error = copyin(blkvp.blkiov, blkiov,
2034 1.214 ad blkcnt * sizeof(BLOCK_INFO))) != 0) {
2035 1.214 ad lfs_free(fs, blkiov, LFS_NB_BLKIOV);
2036 1.214 ad return error;
2037 1.214 ad }
2038 1.214 ad
2039 1.214 ad mutex_enter(&lfs_lock);
2040 1.214 ad ++fs->lfs_sleepers;
2041 1.214 ad mutex_exit(&lfs_lock);
2042 1.214 ad if (ap->a_command == LFCNBMAPV)
2043 1.282 dholland error = lfs_bmapv(l, fsidp, blkiov, blkcnt);
2044 1.214 ad else /* LFCNMARKV */
2045 1.282 dholland error = lfs_markv(l, fsidp, blkiov, blkcnt);
2046 1.214 ad if (error == 0)
2047 1.214 ad error = copyout(blkiov, blkvp.blkiov,
2048 1.214 ad blkcnt * sizeof(BLOCK_INFO));
2049 1.214 ad mutex_enter(&lfs_lock);
2050 1.214 ad if (--fs->lfs_sleepers == 0)
2051 1.308 maya cv_broadcast(&fs->lfs_sleeperscv);
2052 1.214 ad mutex_exit(&lfs_lock);
2053 1.214 ad lfs_free(fs, blkiov, LFS_NB_BLKIOV);
2054 1.214 ad return error;
2055 1.92 perseant
2056 1.92 perseant case LFCNRECLAIM:
2057 1.214 ad /*
2058 1.214 ad * Flush dirops and write Ifile, allowing empty segments
2059 1.214 ad * to be immediately reclaimed.
2060 1.214 ad */
2061 1.214 ad lfs_writer_enter(fs, "pndirop");
2062 1.274 dholland off = lfs_sb_getoffset(fs);
2063 1.214 ad lfs_seglock(fs, SEGM_FORCE_CKP | SEGM_CKP);
2064 1.214 ad lfs_flush_dirops(fs);
2065 1.214 ad LFS_CLEANERINFO(cip, fs, bp);
2066 1.284 dholland oclean = lfs_ci_getclean(fs, cip);
2067 1.214 ad LFS_SYNC_CLEANERINFO(cip, fs, bp, 1);
2068 1.214 ad lfs_segwrite(ap->a_vp->v_mount, SEGM_FORCE_CKP);
2069 1.214 ad fs->lfs_sp->seg_flags |= SEGM_PROT;
2070 1.214 ad lfs_segunlock(fs);
2071 1.214 ad lfs_writer_leave(fs);
2072 1.92 perseant
2073 1.136 perseant #ifdef DEBUG
2074 1.214 ad LFS_CLEANERINFO(cip, fs, bp);
2075 1.214 ad DLOG((DLOG_CLEAN, "lfs_fcntl: reclaim wrote %" PRId64
2076 1.214 ad " blocks, cleaned %" PRId32 " segments (activesb %d)\n",
2077 1.284 dholland lfs_sb_getoffset(fs) - off,
2078 1.284 dholland lfs_ci_getclean(fs, cip) - oclean,
2079 1.214 ad fs->lfs_activesb));
2080 1.214 ad LFS_SYNC_CLEANERINFO(cip, fs, bp, 0);
2081 1.258 christos #else
2082 1.258 christos __USE(oclean);
2083 1.258 christos __USE(off);
2084 1.92 perseant #endif
2085 1.92 perseant
2086 1.214 ad return 0;
2087 1.89 perseant
2088 1.182 martin case LFCNIFILEFH_COMPAT:
2089 1.214 ad /* Return the filehandle of the Ifile */
2090 1.221 elad if ((error = kauth_authorize_system(l->l_cred,
2091 1.221 elad KAUTH_SYSTEM_FILEHANDLE, 0, NULL, NULL, NULL)) != 0)
2092 1.214 ad return (error);
2093 1.214 ad fhp = (struct fhandle *)ap->a_data;
2094 1.214 ad fhp->fh_fsid = *fsidp;
2095 1.214 ad fh_size = 16; /* former VFS_MAXFIDSIZ */
2096 1.214 ad return lfs_vptofh(fs->lfs_ivnode, &(fhp->fh_fid), &fh_size);
2097 1.182 martin
2098 1.187 martin case LFCNIFILEFH_COMPAT2:
2099 1.134 perseant case LFCNIFILEFH:
2100 1.214 ad /* Return the filehandle of the Ifile */
2101 1.214 ad fhp = (struct fhandle *)ap->a_data;
2102 1.214 ad fhp->fh_fsid = *fsidp;
2103 1.214 ad fh_size = sizeof(struct lfs_fhandle) -
2104 1.214 ad offsetof(fhandle_t, fh_fid);
2105 1.214 ad return lfs_vptofh(fs->lfs_ivnode, &(fhp->fh_fid), &fh_size);
2106 1.134 perseant
2107 1.148 perseant case LFCNREWIND:
2108 1.214 ad /* Move lfs_offset to the lowest-numbered segment */
2109 1.214 ad return lfs_rewind(fs, *(int *)ap->a_data);
2110 1.148 perseant
2111 1.148 perseant case LFCNINVAL:
2112 1.214 ad /* Mark a segment SEGUSE_INVAL */
2113 1.214 ad LFS_SEGENTRY(sup, fs, *(int *)ap->a_data, bp);
2114 1.214 ad if (sup->su_nbytes > 0) {
2115 1.214 ad brelse(bp, 0);
2116 1.214 ad lfs_unset_inval_all(fs);
2117 1.214 ad return EBUSY;
2118 1.214 ad }
2119 1.214 ad sup->su_flags |= SEGUSE_INVAL;
2120 1.236 hannken VOP_BWRITE(bp->b_vp, bp);
2121 1.214 ad return 0;
2122 1.148 perseant
2123 1.148 perseant case LFCNRESIZE:
2124 1.214 ad /* Resize the filesystem */
2125 1.214 ad return lfs_resize_fs(fs, *(int *)ap->a_data);
2126 1.148 perseant
2127 1.168 perseant case LFCNWRAPSTOP:
2128 1.179 perseant case LFCNWRAPSTOP_COMPAT:
2129 1.214 ad /*
2130 1.214 ad * Hold lfs_newseg at segment 0; if requested, sleep until
2131 1.214 ad * the filesystem wraps around. To support external agents
2132 1.214 ad * (dump, fsck-based regression test) that need to look at
2133 1.214 ad * a snapshot of the filesystem, without necessarily
2134 1.214 ad * requiring that all fs activity stops.
2135 1.214 ad */
2136 1.214 ad if (fs->lfs_stoplwp == curlwp)
2137 1.214 ad return EALREADY;
2138 1.214 ad
2139 1.214 ad mutex_enter(&lfs_lock);
2140 1.214 ad while (fs->lfs_stoplwp != NULL)
2141 1.214 ad cv_wait(&fs->lfs_stopcv, &lfs_lock);
2142 1.214 ad fs->lfs_stoplwp = curlwp;
2143 1.214 ad if (fs->lfs_nowrap == 0)
2144 1.275 dholland log(LOG_NOTICE, "%s: disabled log wrap\n",
2145 1.275 dholland lfs_sb_getfsmnt(fs));
2146 1.214 ad ++fs->lfs_nowrap;
2147 1.222 christos if (*(int *)ap->a_data == 1
2148 1.224 pooka || ap->a_command == LFCNWRAPSTOP_COMPAT) {
2149 1.214 ad log(LOG_NOTICE, "LFCNSTOPWRAP waiting for log wrap\n");
2150 1.214 ad error = mtsleep(&fs->lfs_nowrap, PCATCH | PUSER,
2151 1.214 ad "segwrap", 0, &lfs_lock);
2152 1.214 ad log(LOG_NOTICE, "LFCNSTOPWRAP done waiting\n");
2153 1.214 ad if (error) {
2154 1.214 ad lfs_wrapgo(fs, VTOI(ap->a_vp), 0);
2155 1.214 ad }
2156 1.214 ad }
2157 1.214 ad mutex_exit(&lfs_lock);
2158 1.214 ad return 0;
2159 1.168 perseant
2160 1.168 perseant case LFCNWRAPGO:
2161 1.179 perseant case LFCNWRAPGO_COMPAT:
2162 1.214 ad /*
2163 1.214 ad * Having done its work, the agent wakes up the writer.
2164 1.214 ad * If the argument is 1, it sleeps until a new segment
2165 1.214 ad * is selected.
2166 1.214 ad */
2167 1.214 ad mutex_enter(&lfs_lock);
2168 1.214 ad error = lfs_wrapgo(fs, VTOI(ap->a_vp),
2169 1.222 christos ap->a_command == LFCNWRAPGO_COMPAT ? 1 :
2170 1.222 christos *((int *)ap->a_data));
2171 1.214 ad mutex_exit(&lfs_lock);
2172 1.214 ad return error;
2173 1.168 perseant
2174 1.188 perseant case LFCNWRAPPASS:
2175 1.214 ad if ((VTOI(ap->a_vp)->i_lfs_iflags & LFSI_WRAPWAIT))
2176 1.214 ad return EALREADY;
2177 1.214 ad mutex_enter(&lfs_lock);
2178 1.214 ad if (fs->lfs_stoplwp != curlwp) {
2179 1.214 ad mutex_exit(&lfs_lock);
2180 1.214 ad return EALREADY;
2181 1.214 ad }
2182 1.214 ad if (fs->lfs_nowrap == 0) {
2183 1.214 ad mutex_exit(&lfs_lock);
2184 1.214 ad return EBUSY;
2185 1.214 ad }
2186 1.214 ad fs->lfs_wrappass = 1;
2187 1.214 ad wakeup(&fs->lfs_wrappass);
2188 1.214 ad /* Wait for the log to wrap, if asked */
2189 1.214 ad if (*(int *)ap->a_data) {
2190 1.272 hannken vref(ap->a_vp);
2191 1.214 ad VTOI(ap->a_vp)->i_lfs_iflags |= LFSI_WRAPWAIT;
2192 1.214 ad log(LOG_NOTICE, "LFCNPASS waiting for log wrap\n");
2193 1.214 ad error = mtsleep(&fs->lfs_nowrap, PCATCH | PUSER,
2194 1.214 ad "segwrap", 0, &lfs_lock);
2195 1.214 ad log(LOG_NOTICE, "LFCNPASS done waiting\n");
2196 1.214 ad VTOI(ap->a_vp)->i_lfs_iflags &= ~LFSI_WRAPWAIT;
2197 1.272 hannken vrele(ap->a_vp);
2198 1.214 ad }
2199 1.214 ad mutex_exit(&lfs_lock);
2200 1.214 ad return error;
2201 1.188 perseant
2202 1.188 perseant case LFCNWRAPSTATUS:
2203 1.214 ad mutex_enter(&lfs_lock);
2204 1.214 ad *(int *)ap->a_data = fs->lfs_wrapstatus;
2205 1.214 ad mutex_exit(&lfs_lock);
2206 1.214 ad return 0;
2207 1.188 perseant
2208 1.89 perseant default:
2209 1.245 dholland return ulfs_fcntl(v);
2210 1.89 perseant }
2211 1.89 perseant return 0;
2212 1.60 chs }
2213 1.60 chs
2214 1.84 perseant /*
2215 1.84 perseant * Return the last logical file offset that should be written for this file
2216 1.86 perseant * if we're doing a write that ends at "size". If writing, we need to know
2217 1.84 perseant * about sizes on disk, i.e. fragments if there are any; if reading, we need
2218 1.84 perseant * to know about entire blocks.
2219 1.84 perseant */
2220 1.84 perseant void
2221 1.84 perseant lfs_gop_size(struct vnode *vp, off_t size, off_t *eobp, int flags)
2222 1.84 perseant {
2223 1.84 perseant struct inode *ip = VTOI(vp);
2224 1.135 perry struct lfs *fs = ip->i_lfs;
2225 1.84 perseant daddr_t olbn, nlbn;
2226 1.84 perseant
2227 1.248 christos olbn = lfs_lblkno(fs, ip->i_size);
2228 1.248 christos nlbn = lfs_lblkno(fs, size);
2229 1.245 dholland if (!(flags & GOP_SIZE_MEM) && nlbn < ULFS_NDADDR && olbn <= nlbn) {
2230 1.248 christos *eobp = lfs_fragroundup(fs, size);
2231 1.86 perseant } else {
2232 1.248 christos *eobp = lfs_blkroundup(fs, size);
2233 1.86 perseant }
2234 1.84 perseant }
2235 1.84 perseant
#ifdef DEBUG
void lfs_dump_vop(void *);

/*
 * lfs_dump_vop: debugging aid, compiled only under DEBUG.
 *
 * Interprets v as a vop_putpages_args, prints the vnode it names (only
 * when DDB is also configured) and then dumps that vnode's dinode via
 * lfs_dump_dinode().
 */
void
lfs_dump_vop(void *v)
{
	struct vop_putpages_args /* {
		struct vnode *a_vp;
		voff_t a_offlo;
		voff_t a_offhi;
		int a_flags;
	} */ *ap = v;
	struct vnode *vp = ap->a_vp;
	struct inode *ip = VTOI(vp);
	struct lfs *fs = ip->i_lfs;

#ifdef DDB
	vfs_vnode_print(vp, 0, printf);
#endif
	lfs_dump_dinode(fs, ip->i_din);
}
#endif /* DEBUG */
2258 1.84 perseant
2259 1.84 perseant int
2260 1.84 perseant lfs_mmap(void *v)
2261 1.84 perseant {
2262 1.84 perseant struct vop_mmap_args /* {
2263 1.86 perseant const struct vnodeop_desc *a_desc;
2264 1.86 perseant struct vnode *a_vp;
2265 1.209 pooka vm_prot_t a_prot;
2266 1.176 elad kauth_cred_t a_cred;
2267 1.84 perseant } */ *ap = v;
2268 1.84 perseant
2269 1.84 perseant if (VTOI(ap->a_vp)->i_number == LFS_IFILE_INUM)
2270 1.84 perseant return EOPNOTSUPP;
2271 1.245 dholland return ulfs_mmap(v);
2272 1.84 perseant }
2273 1.254 dholland
2274 1.254 dholland static int
2275 1.254 dholland lfs_openextattr(void *v)
2276 1.254 dholland {
2277 1.254 dholland struct vop_openextattr_args /* {
2278 1.254 dholland struct vnode *a_vp;
2279 1.254 dholland kauth_cred_t a_cred;
2280 1.254 dholland struct proc *a_p;
2281 1.254 dholland } */ *ap = v;
2282 1.311 riastrad struct vnode *vp = ap->a_vp;
2283 1.311 riastrad struct inode *ip;
2284 1.311 riastrad struct ulfsmount *ump;
2285 1.311 riastrad
2286 1.311 riastrad KASSERT(VOP_ISLOCKED(vp) == LK_EXCLUSIVE);
2287 1.311 riastrad
2288 1.311 riastrad ip = VTOI(vp);
2289 1.311 riastrad ump = ip->i_ump;
2290 1.254 dholland
2291 1.254 dholland /* Not supported for ULFS1 file systems. */
2292 1.254 dholland if (ump->um_fstype == ULFS1)
2293 1.254 dholland return (EOPNOTSUPP);
2294 1.254 dholland
2295 1.254 dholland /* XXX Not implemented for ULFS2 file systems. */
2296 1.254 dholland return (EOPNOTSUPP);
2297 1.254 dholland }
2298 1.254 dholland
2299 1.254 dholland static int
2300 1.254 dholland lfs_closeextattr(void *v)
2301 1.254 dholland {
2302 1.254 dholland struct vop_closeextattr_args /* {
2303 1.254 dholland struct vnode *a_vp;
2304 1.254 dholland int a_commit;
2305 1.254 dholland kauth_cred_t a_cred;
2306 1.254 dholland struct proc *a_p;
2307 1.254 dholland } */ *ap = v;
2308 1.311 riastrad struct vnode *vp = ap->a_vp;
2309 1.311 riastrad struct inode *ip;
2310 1.311 riastrad struct ulfsmount *ump;
2311 1.311 riastrad
2312 1.311 riastrad KASSERT(VOP_ISLOCKED(vp) == LK_EXCLUSIVE);
2313 1.311 riastrad
2314 1.312 riastrad ip = VTOI(vp);
2315 1.311 riastrad ump = ip->i_ump;
2316 1.254 dholland
2317 1.254 dholland /* Not supported for ULFS1 file systems. */
2318 1.254 dholland if (ump->um_fstype == ULFS1)
2319 1.254 dholland return (EOPNOTSUPP);
2320 1.254 dholland
2321 1.254 dholland /* XXX Not implemented for ULFS2 file systems. */
2322 1.254 dholland return (EOPNOTSUPP);
2323 1.254 dholland }
2324 1.254 dholland
2325 1.254 dholland static int
2326 1.254 dholland lfs_getextattr(void *v)
2327 1.254 dholland {
2328 1.254 dholland struct vop_getextattr_args /* {
2329 1.254 dholland struct vnode *a_vp;
2330 1.254 dholland int a_attrnamespace;
2331 1.254 dholland const char *a_name;
2332 1.254 dholland struct uio *a_uio;
2333 1.254 dholland size_t *a_size;
2334 1.254 dholland kauth_cred_t a_cred;
2335 1.254 dholland struct proc *a_p;
2336 1.254 dholland } */ *ap = v;
2337 1.254 dholland struct vnode *vp = ap->a_vp;
2338 1.311 riastrad struct inode *ip;
2339 1.311 riastrad struct ulfsmount *ump;
2340 1.254 dholland int error;
2341 1.254 dholland
2342 1.311 riastrad KASSERT(VOP_ISLOCKED(vp));
2343 1.311 riastrad
2344 1.311 riastrad ip = VTOI(vp);
2345 1.311 riastrad ump = ip->i_ump;
2346 1.311 riastrad
2347 1.254 dholland if (ump->um_fstype == ULFS1) {
2348 1.254 dholland #ifdef LFS_EXTATTR
2349 1.254 dholland error = ulfs_getextattr(ap);
2350 1.254 dholland #else
2351 1.254 dholland error = EOPNOTSUPP;
2352 1.254 dholland #endif
2353 1.254 dholland return error;
2354 1.254 dholland }
2355 1.254 dholland
2356 1.254 dholland /* XXX Not implemented for ULFS2 file systems. */
2357 1.254 dholland return (EOPNOTSUPP);
2358 1.254 dholland }
2359 1.254 dholland
2360 1.254 dholland static int
2361 1.254 dholland lfs_setextattr(void *v)
2362 1.254 dholland {
2363 1.254 dholland struct vop_setextattr_args /* {
2364 1.254 dholland struct vnode *a_vp;
2365 1.254 dholland int a_attrnamespace;
2366 1.254 dholland const char *a_name;
2367 1.254 dholland struct uio *a_uio;
2368 1.254 dholland kauth_cred_t a_cred;
2369 1.254 dholland struct proc *a_p;
2370 1.254 dholland } */ *ap = v;
2371 1.254 dholland struct vnode *vp = ap->a_vp;
2372 1.311 riastrad struct inode *ip;
2373 1.311 riastrad struct ulfsmount *ump;
2374 1.254 dholland int error;
2375 1.254 dholland
2376 1.311 riastrad KASSERT(VOP_ISLOCKED(vp) == LK_EXCLUSIVE);
2377 1.311 riastrad
2378 1.311 riastrad ip = VTOI(vp);
2379 1.311 riastrad ump = ip->i_ump;
2380 1.311 riastrad
2381 1.254 dholland if (ump->um_fstype == ULFS1) {
2382 1.254 dholland #ifdef LFS_EXTATTR
2383 1.254 dholland error = ulfs_setextattr(ap);
2384 1.254 dholland #else
2385 1.254 dholland error = EOPNOTSUPP;
2386 1.254 dholland #endif
2387 1.254 dholland return error;
2388 1.254 dholland }
2389 1.254 dholland
2390 1.254 dholland /* XXX Not implemented for ULFS2 file systems. */
2391 1.254 dholland return (EOPNOTSUPP);
2392 1.254 dholland }
2393 1.254 dholland
2394 1.254 dholland static int
2395 1.254 dholland lfs_listextattr(void *v)
2396 1.254 dholland {
2397 1.254 dholland struct vop_listextattr_args /* {
2398 1.254 dholland struct vnode *a_vp;
2399 1.254 dholland int a_attrnamespace;
2400 1.254 dholland struct uio *a_uio;
2401 1.254 dholland size_t *a_size;
2402 1.254 dholland kauth_cred_t a_cred;
2403 1.254 dholland struct proc *a_p;
2404 1.254 dholland } */ *ap = v;
2405 1.254 dholland struct vnode *vp = ap->a_vp;
2406 1.311 riastrad struct inode *ip;
2407 1.311 riastrad struct ulfsmount *ump;
2408 1.254 dholland int error;
2409 1.254 dholland
2410 1.311 riastrad KASSERT(VOP_ISLOCKED(vp));
2411 1.311 riastrad
2412 1.311 riastrad ip = VTOI(vp);
2413 1.311 riastrad ump = ip->i_ump;
2414 1.311 riastrad
2415 1.254 dholland if (ump->um_fstype == ULFS1) {
2416 1.254 dholland #ifdef LFS_EXTATTR
2417 1.254 dholland error = ulfs_listextattr(ap);
2418 1.254 dholland #else
2419 1.254 dholland error = EOPNOTSUPP;
2420 1.254 dholland #endif
2421 1.254 dholland return error;
2422 1.254 dholland }
2423 1.254 dholland
2424 1.254 dholland /* XXX Not implemented for ULFS2 file systems. */
2425 1.254 dholland return (EOPNOTSUPP);
2426 1.254 dholland }
2427 1.254 dholland
2428 1.254 dholland static int
2429 1.254 dholland lfs_deleteextattr(void *v)
2430 1.254 dholland {
2431 1.254 dholland struct vop_deleteextattr_args /* {
2432 1.254 dholland struct vnode *a_vp;
2433 1.254 dholland int a_attrnamespace;
2434 1.254 dholland kauth_cred_t a_cred;
2435 1.254 dholland struct proc *a_p;
2436 1.254 dholland } */ *ap = v;
2437 1.254 dholland struct vnode *vp = ap->a_vp;
2438 1.311 riastrad struct inode *ip;
2439 1.311 riastrad struct ulfsmount *ump;
2440 1.254 dholland int error;
2441 1.254 dholland
2442 1.311 riastrad KASSERT(VOP_ISLOCKED(vp) == LK_EXCLUSIVE);
2443 1.311 riastrad
2444 1.311 riastrad ip = VTOI(vp);
2445 1.311 riastrad ump = ip->i_ump;
2446 1.311 riastrad
2447 1.254 dholland if (ump->um_fstype == ULFS1) {
2448 1.254 dholland #ifdef LFS_EXTATTR
2449 1.254 dholland error = ulfs_deleteextattr(ap);
2450 1.254 dholland #else
2451 1.254 dholland error = EOPNOTSUPP;
2452 1.254 dholland #endif
2453 1.254 dholland return error;
2454 1.254 dholland }
2455 1.254 dholland
2456 1.254 dholland /* XXX Not implemented for ULFS2 file systems. */
2457 1.254 dholland return (EOPNOTSUPP);
2458 1.254 dholland }
2459 1.299 dholland
2460