ffs_inode.c revision 1.124 1 1.124 riastrad /* $NetBSD: ffs_inode.c,v 1.124 2017/03/18 05:26:40 riastradh Exp $ */
2 1.98 simonb
3 1.98 simonb /*-
4 1.98 simonb * Copyright (c) 2008 The NetBSD Foundation, Inc.
5 1.98 simonb * All rights reserved.
6 1.98 simonb *
7 1.98 simonb * This code is derived from software contributed to The NetBSD Foundation
8 1.98 simonb * by Wasabi Systems, Inc.
9 1.98 simonb *
10 1.98 simonb * Redistribution and use in source and binary forms, with or without
11 1.98 simonb * modification, are permitted provided that the following conditions
12 1.98 simonb * are met:
13 1.98 simonb * 1. Redistributions of source code must retain the above copyright
14 1.98 simonb * notice, this list of conditions and the following disclaimer.
15 1.98 simonb * 2. Redistributions in binary form must reproduce the above copyright
16 1.98 simonb * notice, this list of conditions and the following disclaimer in the
17 1.98 simonb * documentation and/or other materials provided with the distribution.
18 1.98 simonb *
19 1.98 simonb * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
20 1.98 simonb * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
21 1.98 simonb * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 1.98 simonb * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
23 1.98 simonb * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24 1.98 simonb * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25 1.98 simonb * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26 1.98 simonb * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27 1.98 simonb * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28 1.98 simonb * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29 1.98 simonb * POSSIBILITY OF SUCH DAMAGE.
30 1.98 simonb */
31 1.5 cgd
32 1.1 mycroft /*
33 1.1 mycroft * Copyright (c) 1982, 1986, 1989, 1993
34 1.1 mycroft * The Regents of the University of California. All rights reserved.
35 1.1 mycroft *
36 1.1 mycroft * Redistribution and use in source and binary forms, with or without
37 1.1 mycroft * modification, are permitted provided that the following conditions
38 1.1 mycroft * are met:
39 1.1 mycroft * 1. Redistributions of source code must retain the above copyright
40 1.1 mycroft * notice, this list of conditions and the following disclaimer.
41 1.1 mycroft * 2. Redistributions in binary form must reproduce the above copyright
42 1.1 mycroft * notice, this list of conditions and the following disclaimer in the
43 1.1 mycroft * documentation and/or other materials provided with the distribution.
44 1.60 agc * 3. Neither the name of the University nor the names of its contributors
45 1.1 mycroft * may be used to endorse or promote products derived from this software
46 1.1 mycroft * without specific prior written permission.
47 1.1 mycroft *
48 1.1 mycroft * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
49 1.1 mycroft * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
50 1.1 mycroft * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
51 1.1 mycroft * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
52 1.1 mycroft * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
53 1.1 mycroft * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
54 1.1 mycroft * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
55 1.1 mycroft * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
56 1.1 mycroft * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
57 1.1 mycroft * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
58 1.1 mycroft * SUCH DAMAGE.
59 1.1 mycroft *
60 1.18 fvdl * @(#)ffs_inode.c 8.13 (Berkeley) 4/21/95
61 1.1 mycroft */
62 1.46 lukem
63 1.46 lukem #include <sys/cdefs.h>
64 1.124 riastrad __KERNEL_RCSID(0, "$NetBSD: ffs_inode.c,v 1.124 2017/03/18 05:26:40 riastradh Exp $");
65 1.17 mrg
66 1.41 mrg #if defined(_KERNEL_OPT)
67 1.25 thorpej #include "opt_ffs.h"
68 1.20 scottr #include "opt_quota.h"
69 1.21 scottr #endif
70 1.1 mycroft
71 1.1 mycroft #include <sys/param.h>
72 1.1 mycroft #include <sys/systm.h>
73 1.98 simonb #include <sys/buf.h>
74 1.1 mycroft #include <sys/file.h>
75 1.98 simonb #include <sys/fstrans.h>
76 1.98 simonb #include <sys/kauth.h>
77 1.1 mycroft #include <sys/kernel.h>
78 1.109 para #include <sys/kmem.h>
79 1.98 simonb #include <sys/mount.h>
80 1.98 simonb #include <sys/proc.h>
81 1.98 simonb #include <sys/resourcevar.h>
82 1.1 mycroft #include <sys/trace.h>
83 1.98 simonb #include <sys/vnode.h>
84 1.98 simonb #include <sys/wapbl.h>
85 1.16 mrg
86 1.1 mycroft #include <ufs/ufs/quota.h>
87 1.1 mycroft #include <ufs/ufs/inode.h>
88 1.1 mycroft #include <ufs/ufs/ufsmount.h>
89 1.1 mycroft #include <ufs/ufs/ufs_extern.h>
90 1.19 bouyer #include <ufs/ufs/ufs_bswap.h>
91 1.98 simonb #include <ufs/ufs/ufs_wapbl.h>
92 1.1 mycroft
93 1.1 mycroft #include <ufs/ffs/fs.h>
94 1.1 mycroft #include <ufs/ffs/ffs_extern.h>
95 1.1 mycroft
96 1.72 thorpej static int ffs_indirtrunc(struct inode *, daddr_t, daddr_t, daddr_t, int,
97 1.72 thorpej int64_t *);
98 1.1 mycroft
99 1.1 mycroft /*
100 1.13 tls * Update the access, modified, and inode change times as specified
101 1.13 tls * by the IN_ACCESS, IN_UPDATE, and IN_CHANGE flags respectively.
102 1.13 tls * The IN_MODIFIED flag is used to specify that the inode needs to be
103 1.13 tls * updated but that the times have already been set. The access
104 1.13 tls * and modified times are taken from the second and third parameters;
105 1.13 tls * the inode change time is always taken from the current time. If
106 1.103 ad * UPDATE_WAIT flag is set, or UPDATE_DIROP is set then wait for the
107 1.103 ad * disk write of the inode to complete.
108 1.1 mycroft */
109 1.13 tls
110 1.1 mycroft int
111 1.77 yamt ffs_update(struct vnode *vp, const struct timespec *acc,
112 1.77 yamt const struct timespec *mod, int updflags)
113 1.9 christos {
114 1.30 augustss struct fs *fs;
115 1.1 mycroft struct buf *bp;
116 1.1 mycroft struct inode *ip;
117 1.1 mycroft int error;
118 1.86 christos void *cp;
119 1.34 mycroft int waitfor, flags;
120 1.1 mycroft
121 1.77 yamt if (vp->v_mount->mnt_flag & MNT_RDONLY)
122 1.11 mycroft return (0);
123 1.77 yamt ip = VTOI(vp);
124 1.77 yamt FFS_ITIMES(ip, acc, mod, NULL);
125 1.77 yamt if (updflags & UPDATE_CLOSE)
126 1.65 mycroft flags = ip->i_flag & (IN_MODIFIED | IN_ACCESSED);
127 1.65 mycroft else
128 1.65 mycroft flags = ip->i_flag & IN_MODIFIED;
129 1.34 mycroft if (flags == 0)
130 1.1 mycroft return (0);
131 1.1 mycroft fs = ip->i_fs;
132 1.31 perseant
133 1.35 mycroft if ((flags & IN_MODIFIED) != 0 &&
134 1.77 yamt (vp->v_mount->mnt_flag & MNT_ASYNC) == 0) {
135 1.77 yamt waitfor = updflags & UPDATE_WAIT;
136 1.103 ad if ((updflags & UPDATE_DIROP) != 0)
137 1.35 mycroft waitfor |= UPDATE_WAIT;
138 1.35 mycroft } else
139 1.35 mycroft waitfor = 0;
140 1.31 perseant
141 1.1 mycroft /*
142 1.1 mycroft * Ensure that uid and gid are correct. This is a temporary
143 1.1 mycroft * fix until fsck has been changed to do the update.
144 1.1 mycroft */
145 1.55 fvdl if (fs->fs_magic == FS_UFS1_MAGIC && /* XXX */
146 1.55 fvdl fs->fs_old_inodefmt < FS_44INODEFMT) { /* XXX */
147 1.55 fvdl ip->i_ffs1_ouid = ip->i_uid; /* XXX */
148 1.55 fvdl ip->i_ffs1_ogid = ip->i_gid; /* XXX */
149 1.18 fvdl } /* XXX */
150 1.9 christos error = bread(ip->i_devvp,
151 1.114 dholland FFS_FSBTODB(fs, ino_to_fsba(fs, ip->i_number)),
152 1.117 maxv (int)fs->fs_bsize, B_MODIFY, &bp);
153 1.9 christos if (error) {
154 1.1 mycroft return (error);
155 1.1 mycroft }
156 1.35 mycroft ip->i_flag &= ~(IN_MODIFIED | IN_ACCESSED);
157 1.98 simonb /* Keep unlinked inode list up to date */
158 1.110 matt KDASSERTMSG(DIP(ip, nlink) == ip->i_nlink,
159 1.110 matt "DIP(ip, nlink) [%d] == ip->i_nlink [%d]",
160 1.110 matt DIP(ip, nlink), ip->i_nlink);
161 1.98 simonb if (ip->i_mode) {
162 1.98 simonb if (ip->i_nlink > 0) {
163 1.98 simonb UFS_WAPBL_UNREGISTER_INODE(ip->i_ump->um_mountp,
164 1.98 simonb ip->i_number, ip->i_mode);
165 1.98 simonb } else {
166 1.98 simonb UFS_WAPBL_REGISTER_INODE(ip->i_ump->um_mountp,
167 1.98 simonb ip->i_number, ip->i_mode);
168 1.98 simonb }
169 1.98 simonb }
170 1.55 fvdl if (fs->fs_magic == FS_UFS1_MAGIC) {
171 1.86 christos cp = (char *)bp->b_data +
172 1.55 fvdl (ino_to_fsbo(fs, ip->i_number) * DINODE1_SIZE);
173 1.23 christos #ifdef FFS_EI
174 1.55 fvdl if (UFS_FSNEEDSWAP(fs))
175 1.55 fvdl ffs_dinode1_swap(ip->i_din.ffs1_din,
176 1.55 fvdl (struct ufs1_dinode *)cp);
177 1.55 fvdl else
178 1.55 fvdl #endif
179 1.55 fvdl memcpy(cp, ip->i_din.ffs1_din, DINODE1_SIZE);
180 1.55 fvdl } else {
181 1.86 christos cp = (char *)bp->b_data +
182 1.55 fvdl (ino_to_fsbo(fs, ip->i_number) * DINODE2_SIZE);
183 1.55 fvdl #ifdef FFS_EI
184 1.55 fvdl if (UFS_FSNEEDSWAP(fs))
185 1.55 fvdl ffs_dinode2_swap(ip->i_din.ffs2_din,
186 1.55 fvdl (struct ufs2_dinode *)cp);
187 1.55 fvdl else
188 1.23 christos #endif
189 1.55 fvdl memcpy(cp, ip->i_din.ffs2_din, DINODE2_SIZE);
190 1.55 fvdl }
191 1.35 mycroft if (waitfor) {
192 1.1 mycroft return (bwrite(bp));
193 1.29 fvdl } else {
194 1.1 mycroft bdwrite(bp);
195 1.1 mycroft return (0);
196 1.1 mycroft }
197 1.1 mycroft }
198 1.1 mycroft
/* Indices of the three indirection levels in the per-level arrays. */
#define	SINGLE	0	/* index of single indirect block */
#define	DOUBLE	1	/* index of double indirect block */
#define	TRIPLE	2	/* index of triple indirect block */
202 1.1 mycroft /*
203 1.1 mycroft * Truncate the inode oip to at most length size, freeing the
204 1.1 mycroft * disk blocks.
205 1.1 mycroft */
206 1.9 christos int
207 1.92 pooka ffs_truncate(struct vnode *ovp, off_t length, int ioflag, kauth_cred_t cred)
208 1.9 christos {
209 1.53 fvdl daddr_t lastblock;
210 1.68 mycroft struct inode *oip = VTOI(ovp);
211 1.112 dholland daddr_t bn, lastiblock[UFS_NIADDR], indir_lbn[UFS_NIADDR];
212 1.112 dholland daddr_t blks[UFS_NDADDR + UFS_NIADDR];
213 1.30 augustss struct fs *fs;
214 1.85 yamt int offset, pgoffset, level;
215 1.118 jdolecek int64_t blocksreleased = 0;
216 1.77 yamt int i, aflag, nblocks;
217 1.38 chs int error, allerror = 0;
218 1.1 mycroft off_t osize;
219 1.67 mycroft int sync;
220 1.68 mycroft struct ufsmount *ump = oip->i_ump;
221 1.122 jdolecek void *dcookie;
222 1.1 mycroft
223 1.118 jdolecek UFS_WAPBL_JLOCK_ASSERT(ip->i_ump->um_mountp);
224 1.118 jdolecek
225 1.78 yamt if (ovp->v_type == VCHR || ovp->v_type == VBLK ||
226 1.78 yamt ovp->v_type == VFIFO || ovp->v_type == VSOCK) {
227 1.78 yamt KASSERT(oip->i_size == 0);
228 1.78 yamt return 0;
229 1.78 yamt }
230 1.78 yamt
231 1.2 pk if (length < 0)
232 1.3 mycroft return (EINVAL);
233 1.68 mycroft
234 1.1 mycroft if (ovp->v_type == VLNK &&
235 1.68 mycroft (oip->i_size < ump->um_maxsymlinklen ||
236 1.68 mycroft (ump->um_maxsymlinklen == 0 && DIP(oip, blocks) == 0))) {
237 1.38 chs KDASSERT(length == 0);
238 1.55 fvdl memset(SHORTLINK(oip), 0, (size_t)oip->i_size);
239 1.55 fvdl oip->i_size = 0;
240 1.57 kristerw DIP_ASSIGN(oip, size, 0);
241 1.1 mycroft oip->i_flag |= IN_CHANGE | IN_UPDATE;
242 1.77 yamt return (ffs_update(ovp, NULL, NULL, 0));
243 1.1 mycroft }
244 1.55 fvdl if (oip->i_size == length) {
245 1.104 bouyer /* still do a uvm_vnp_setsize() as writesize may be larger */
246 1.104 bouyer uvm_vnp_setsize(ovp, length);
247 1.1 mycroft oip->i_flag |= IN_CHANGE | IN_UPDATE;
248 1.77 yamt return (ffs_update(ovp, NULL, NULL, 0));
249 1.1 mycroft }
250 1.1 mycroft fs = oip->i_fs;
251 1.68 mycroft if (length > ump->um_maxfilesize)
252 1.38 chs return (EFBIG);
253 1.38 chs
254 1.63 hannken if ((oip->i_flags & SF_SNAPSHOT) != 0)
255 1.63 hannken ffs_snapremove(ovp);
256 1.63 hannken
257 1.55 fvdl osize = oip->i_size;
258 1.50 chs aflag = ioflag & IO_SYNC ? B_SYNC : 0;
259 1.29 fvdl
260 1.38 chs /*
261 1.38 chs * Lengthen the size of the file. We must ensure that the
262 1.38 chs * last byte of the file is allocated. Since the smallest
263 1.38 chs * value of osize is 0, length will be at least 1.
264 1.38 chs */
265 1.38 chs
266 1.38 chs if (osize < length) {
267 1.115 dholland if (ffs_lblkno(fs, osize) < UFS_NDADDR &&
268 1.115 dholland ffs_lblkno(fs, osize) != ffs_lblkno(fs, length) &&
269 1.115 dholland ffs_blkroundup(fs, osize) != osize) {
270 1.69 mycroft off_t eob;
271 1.69 mycroft
272 1.115 dholland eob = ffs_blkroundup(fs, osize);
273 1.87 yamt uvm_vnp_setwritesize(ovp, eob);
274 1.69 mycroft error = ufs_balloc_range(ovp, osize, eob - osize,
275 1.77 yamt cred, aflag);
276 1.108 bouyer if (error) {
277 1.108 bouyer (void) ffs_truncate(ovp, osize,
278 1.108 bouyer ioflag & IO_SYNC, cred);
279 1.48 chs return error;
280 1.108 bouyer }
281 1.48 chs if (ioflag & IO_SYNC) {
282 1.106 rmind mutex_enter(ovp->v_interlock);
283 1.49 chs VOP_PUTPAGES(ovp,
284 1.69 mycroft trunc_page(osize & fs->fs_bmask),
285 1.99 hannken round_page(eob), PGO_CLEANIT | PGO_SYNCIO |
286 1.99 hannken PGO_JOURNALLOCKED);
287 1.48 chs }
288 1.48 chs }
289 1.87 yamt uvm_vnp_setwritesize(ovp, length);
290 1.77 yamt error = ufs_balloc_range(ovp, length - 1, 1, cred, aflag);
291 1.45 chs if (error) {
292 1.92 pooka (void) ffs_truncate(ovp, osize, ioflag & IO_SYNC, cred);
293 1.68 mycroft return (error);
294 1.45 chs }
295 1.43 chs uvm_vnp_setsize(ovp, length);
296 1.38 chs oip->i_flag |= IN_CHANGE | IN_UPDATE;
297 1.55 fvdl KASSERT(ovp->v_size == oip->i_size);
298 1.77 yamt return (ffs_update(ovp, NULL, NULL, 0));
299 1.38 chs }
300 1.38 chs
301 1.38 chs /*
302 1.38 chs * When truncating a regular file down to a non-block-aligned size,
303 1.38 chs * we must zero the part of last block which is past the new EOF.
304 1.38 chs * We must synchronously flush the zeroed pages to disk
305 1.38 chs * since the new pages will be invalidated as soon as we
306 1.38 chs * inform the VM system of the new, smaller size.
307 1.48 chs * We must do this before acquiring the GLOCK, since fetching
308 1.38 chs * the pages will acquire the GLOCK internally.
309 1.38 chs * So there is a window where another thread could see a whole
310 1.38 chs * zeroed page past EOF, but that's life.
311 1.38 chs */
312 1.38 chs
313 1.113 dholland offset = ffs_blkoff(fs, length);
314 1.85 yamt pgoffset = length & PAGE_MASK;
315 1.85 yamt if (ovp->v_type == VREG && (pgoffset != 0 || offset != 0) &&
316 1.85 yamt osize > length) {
317 1.70 mycroft daddr_t lbn;
318 1.38 chs voff_t eoz;
319 1.85 yamt int size;
320 1.38 chs
321 1.85 yamt if (offset != 0) {
322 1.85 yamt error = ufs_balloc_range(ovp, length - 1, 1, cred,
323 1.85 yamt aflag);
324 1.85 yamt if (error)
325 1.85 yamt return error;
326 1.85 yamt }
327 1.115 dholland lbn = ffs_lblkno(fs, length);
328 1.113 dholland size = ffs_blksize(fs, oip, lbn);
329 1.115 dholland eoz = MIN(MAX(ffs_lblktosize(fs, lbn) + size, round_page(pgoffset)),
330 1.85 yamt osize);
331 1.107 hannken ubc_zerorange(&ovp->v_uobj, length, eoz - length,
332 1.107 hannken UBC_UNMAP_FLAG(ovp));
333 1.70 mycroft if (round_page(eoz) > round_page(length)) {
334 1.106 rmind mutex_enter(ovp->v_interlock);
335 1.70 mycroft error = VOP_PUTPAGES(ovp, round_page(length),
336 1.70 mycroft round_page(eoz),
337 1.99 hannken PGO_CLEANIT | PGO_DEACTIVATE | PGO_JOURNALLOCKED |
338 1.71 mycroft ((ioflag & IO_SYNC) ? PGO_SYNCIO : 0));
339 1.70 mycroft if (error)
340 1.70 mycroft return error;
341 1.70 mycroft }
342 1.38 chs }
343 1.38 chs
344 1.84 yamt genfs_node_wrlock(ovp);
345 1.55 fvdl oip->i_size = length;
346 1.57 kristerw DIP_ASSIGN(oip, size, length);
347 1.18 fvdl uvm_vnp_setsize(ovp, length);
348 1.1 mycroft /*
349 1.1 mycroft * Calculate index into inode's block list of
350 1.1 mycroft * last direct and indirect blocks (if any)
351 1.1 mycroft * which we want to keep. Lastblock is -1 when
352 1.1 mycroft * the file is truncated to 0.
353 1.1 mycroft */
354 1.115 dholland lastblock = ffs_lblkno(fs, length + fs->fs_bsize - 1) - 1;
355 1.112 dholland lastiblock[SINGLE] = lastblock - UFS_NDADDR;
356 1.113 dholland lastiblock[DOUBLE] = lastiblock[SINGLE] - FFS_NINDIR(fs);
357 1.113 dholland lastiblock[TRIPLE] = lastiblock[DOUBLE] - FFS_NINDIR(fs) * FFS_NINDIR(fs);
358 1.1 mycroft nblocks = btodb(fs->fs_bsize);
359 1.1 mycroft /*
360 1.1 mycroft * Update file and block pointers on disk before we start freeing
361 1.1 mycroft * blocks. If we crash before free'ing blocks below, the blocks
362 1.1 mycroft * will be returned to the free list. lastiblock values are also
363 1.1 mycroft * normalized to -1 for calls to ffs_indirtrunc below.
364 1.1 mycroft */
365 1.67 mycroft sync = 0;
366 1.55 fvdl for (level = TRIPLE; level >= SINGLE; level--) {
367 1.112 dholland blks[UFS_NDADDR + level] = DIP(oip, ib[level]);
368 1.112 dholland if (lastiblock[level] < 0 && blks[UFS_NDADDR + level] != 0) {
369 1.67 mycroft sync = 1;
370 1.57 kristerw DIP_ASSIGN(oip, ib[level], 0);
371 1.1 mycroft lastiblock[level] = -1;
372 1.1 mycroft }
373 1.55 fvdl }
374 1.112 dholland for (i = 0; i < UFS_NDADDR; i++) {
375 1.64 hannken blks[i] = DIP(oip, db[i]);
376 1.67 mycroft if (i > lastblock && blks[i] != 0) {
377 1.67 mycroft sync = 1;
378 1.57 kristerw DIP_ASSIGN(oip, db[i], 0);
379 1.67 mycroft }
380 1.67 mycroft }
381 1.68 mycroft oip->i_flag |= IN_CHANGE | IN_UPDATE;
382 1.67 mycroft if (sync) {
383 1.77 yamt error = ffs_update(ovp, NULL, NULL, UPDATE_WAIT);
384 1.67 mycroft if (error && !allerror)
385 1.67 mycroft allerror = error;
386 1.55 fvdl }
387 1.32 mycroft
388 1.1 mycroft /*
389 1.1 mycroft * Having written the new inode to disk, save its new configuration
390 1.1 mycroft * and put back the old block pointers long enough to process them.
391 1.1 mycroft * Note that we save the new block configuration so we can check it
392 1.1 mycroft * when we are done.
393 1.1 mycroft */
394 1.112 dholland for (i = 0; i < UFS_NDADDR; i++) {
395 1.64 hannken bn = DIP(oip, db[i]);
396 1.64 hannken DIP_ASSIGN(oip, db[i], blks[i]);
397 1.64 hannken blks[i] = bn;
398 1.55 fvdl }
399 1.112 dholland for (i = 0; i < UFS_NIADDR; i++) {
400 1.64 hannken bn = DIP(oip, ib[i]);
401 1.112 dholland DIP_ASSIGN(oip, ib[i], blks[UFS_NDADDR + i]);
402 1.112 dholland blks[UFS_NDADDR + i] = bn;
403 1.55 fvdl }
404 1.55 fvdl
405 1.55 fvdl oip->i_size = osize;
406 1.57 kristerw DIP_ASSIGN(oip, size, osize);
407 1.32 mycroft error = vtruncbuf(ovp, lastblock + 1, 0, 0);
408 1.32 mycroft if (error && !allerror)
409 1.32 mycroft allerror = error;
410 1.1 mycroft
411 1.1 mycroft /*
412 1.1 mycroft * Indirect blocks first.
413 1.1 mycroft */
414 1.112 dholland indir_lbn[SINGLE] = -UFS_NDADDR;
415 1.113 dholland indir_lbn[DOUBLE] = indir_lbn[SINGLE] - FFS_NINDIR(fs) - 1;
416 1.113 dholland indir_lbn[TRIPLE] = indir_lbn[DOUBLE] - FFS_NINDIR(fs) * FFS_NINDIR(fs) - 1;
417 1.1 mycroft for (level = TRIPLE; level >= SINGLE; level--) {
418 1.55 fvdl if (oip->i_ump->um_fstype == UFS1)
419 1.55 fvdl bn = ufs_rw32(oip->i_ffs1_ib[level],UFS_FSNEEDSWAP(fs));
420 1.55 fvdl else
421 1.55 fvdl bn = ufs_rw64(oip->i_ffs2_ib[level],UFS_FSNEEDSWAP(fs));
422 1.1 mycroft if (bn != 0) {
423 1.122 jdolecek if (lastiblock[level] < 0 &&
424 1.122 jdolecek oip->i_ump->um_mountp->mnt_wapbl) {
425 1.122 jdolecek error = UFS_WAPBL_REGISTER_DEALLOCATION(
426 1.122 jdolecek oip->i_ump->um_mountp,
427 1.122 jdolecek FFS_FSBTODB(fs, bn), fs->fs_bsize,
428 1.122 jdolecek &dcookie);
429 1.122 jdolecek if (error)
430 1.122 jdolecek goto out;
431 1.122 jdolecek } else {
432 1.122 jdolecek dcookie = NULL;
433 1.122 jdolecek }
434 1.122 jdolecek
435 1.1 mycroft error = ffs_indirtrunc(oip, indir_lbn[level],
436 1.118 jdolecek FFS_FSBTODB(fs, bn), lastiblock[level], level,
437 1.118 jdolecek &blocksreleased);
438 1.122 jdolecek if (error) {
439 1.122 jdolecek if (dcookie) {
440 1.122 jdolecek UFS_WAPBL_UNREGISTER_DEALLOCATION(
441 1.122 jdolecek oip->i_ump->um_mountp, dcookie);
442 1.122 jdolecek }
443 1.118 jdolecek goto out;
444 1.122 jdolecek }
445 1.118 jdolecek
446 1.1 mycroft if (lastiblock[level] < 0) {
447 1.122 jdolecek if (!dcookie)
448 1.98 simonb ffs_blkfree(fs, oip->i_devvp, bn,
449 1.98 simonb fs->fs_bsize, oip->i_number);
450 1.118 jdolecek DIP_ASSIGN(oip, ib[level], 0);
451 1.1 mycroft blocksreleased += nblocks;
452 1.1 mycroft }
453 1.1 mycroft }
454 1.1 mycroft if (lastiblock[level] >= 0)
455 1.1 mycroft goto done;
456 1.1 mycroft }
457 1.1 mycroft
458 1.1 mycroft /*
459 1.1 mycroft * All whole direct blocks or frags.
460 1.1 mycroft */
461 1.112 dholland for (i = UFS_NDADDR - 1; i > lastblock; i--) {
462 1.30 augustss long bsize;
463 1.1 mycroft
464 1.55 fvdl if (oip->i_ump->um_fstype == UFS1)
465 1.55 fvdl bn = ufs_rw32(oip->i_ffs1_db[i], UFS_FSNEEDSWAP(fs));
466 1.55 fvdl else
467 1.55 fvdl bn = ufs_rw64(oip->i_ffs2_db[i], UFS_FSNEEDSWAP(fs));
468 1.1 mycroft if (bn == 0)
469 1.1 mycroft continue;
470 1.118 jdolecek
471 1.113 dholland bsize = ffs_blksize(fs, oip, i);
472 1.98 simonb if ((oip->i_ump->um_mountp->mnt_wapbl) &&
473 1.98 simonb (ovp->v_type != VREG)) {
474 1.118 jdolecek error = UFS_WAPBL_REGISTER_DEALLOCATION(
475 1.118 jdolecek oip->i_ump->um_mountp,
476 1.122 jdolecek FFS_FSBTODB(fs, bn), bsize, NULL);
477 1.118 jdolecek if (error)
478 1.118 jdolecek goto out;
479 1.98 simonb } else
480 1.98 simonb ffs_blkfree(fs, oip->i_devvp, bn, bsize, oip->i_number);
481 1.118 jdolecek DIP_ASSIGN(oip, db[i], 0);
482 1.1 mycroft blocksreleased += btodb(bsize);
483 1.1 mycroft }
484 1.1 mycroft if (lastblock < 0)
485 1.1 mycroft goto done;
486 1.1 mycroft
487 1.1 mycroft /*
488 1.1 mycroft * Finally, look for a change in size of the
489 1.1 mycroft * last direct block; release any frags.
490 1.1 mycroft */
491 1.55 fvdl if (oip->i_ump->um_fstype == UFS1)
492 1.55 fvdl bn = ufs_rw32(oip->i_ffs1_db[lastblock], UFS_FSNEEDSWAP(fs));
493 1.55 fvdl else
494 1.55 fvdl bn = ufs_rw64(oip->i_ffs2_db[lastblock], UFS_FSNEEDSWAP(fs));
495 1.1 mycroft if (bn != 0) {
496 1.1 mycroft long oldspace, newspace;
497 1.1 mycroft
498 1.1 mycroft /*
499 1.1 mycroft * Calculate amount of space we're giving
500 1.1 mycroft * back as old block size minus new block size.
501 1.1 mycroft */
502 1.113 dholland oldspace = ffs_blksize(fs, oip, lastblock);
503 1.55 fvdl oip->i_size = length;
504 1.57 kristerw DIP_ASSIGN(oip, size, length);
505 1.113 dholland newspace = ffs_blksize(fs, oip, lastblock);
506 1.1 mycroft if (newspace == 0)
507 1.1 mycroft panic("itrunc: newspace");
508 1.1 mycroft if (oldspace - newspace > 0) {
509 1.1 mycroft /*
510 1.1 mycroft * Block number of space to be free'd is
511 1.1 mycroft * the old block # plus the number of frags
512 1.1 mycroft * required for the storage we're keeping.
513 1.1 mycroft */
514 1.115 dholland bn += ffs_numfrags(fs, newspace);
515 1.98 simonb if ((oip->i_ump->um_mountp->mnt_wapbl) &&
516 1.98 simonb (ovp->v_type != VREG)) {
517 1.118 jdolecek error = UFS_WAPBL_REGISTER_DEALLOCATION(
518 1.114 dholland oip->i_ump->um_mountp, FFS_FSBTODB(fs, bn),
519 1.122 jdolecek oldspace - newspace, NULL);
520 1.118 jdolecek if (error)
521 1.118 jdolecek goto out;
522 1.98 simonb } else
523 1.98 simonb ffs_blkfree(fs, oip->i_devvp, bn,
524 1.98 simonb oldspace - newspace, oip->i_number);
525 1.1 mycroft blocksreleased += btodb(oldspace - newspace);
526 1.1 mycroft }
527 1.1 mycroft }
528 1.32 mycroft
529 1.1 mycroft done:
530 1.1 mycroft for (level = SINGLE; level <= TRIPLE; level++)
531 1.124 riastrad KASSERTMSG((blks[UFS_NDADDR + level] == DIP(oip, ib[level])),
532 1.124 riastrad "itrunc1 blk mismatch: %jx != %jx",
533 1.124 riastrad (uintmax_t)blks[UFS_NDADDR + level],
534 1.124 riastrad (uintmax_t)DIP(oip, ib[level]));
535 1.112 dholland for (i = 0; i < UFS_NDADDR; i++)
536 1.124 riastrad KASSERTMSG((blks[i] == DIP(oip, db[i])),
537 1.124 riastrad "itrunc2 blk mismatch: %jx != %jx",
538 1.124 riastrad (uintmax_t)blks[i], (uintmax_t)DIP(oip, db[i]));
539 1.124 riastrad KASSERTMSG((length != 0 || LIST_EMPTY(&ovp->v_cleanblkhd)),
540 1.124 riastrad "itrunc3: zero length and nonempty cleanblkhd");
541 1.124 riastrad KASSERTMSG((length != 0 || LIST_EMPTY(&ovp->v_dirtyblkhd)),
542 1.124 riastrad "itrunc3: zero length and nonempty dirtyblkhd");
543 1.118 jdolecek
544 1.118 jdolecek out:
545 1.118 jdolecek /*
546 1.118 jdolecek * Set length back to old size if deallocation failed. Some indirect
547 1.118 jdolecek * blocks were deallocated creating a hole, but that is okay.
548 1.118 jdolecek */
549 1.118 jdolecek if (error == EAGAIN) {
550 1.121 jdolecek if (!allerror)
551 1.121 jdolecek allerror = error;
552 1.118 jdolecek length = osize;
553 1.118 jdolecek uvm_vnp_setsize(ovp, length);
554 1.118 jdolecek }
555 1.118 jdolecek
556 1.1 mycroft /*
557 1.1 mycroft * Put back the real size.
558 1.1 mycroft */
559 1.55 fvdl oip->i_size = length;
560 1.57 kristerw DIP_ASSIGN(oip, size, length);
561 1.57 kristerw DIP_ADD(oip, blocks, -blocksreleased);
562 1.84 yamt genfs_node_unlock(ovp);
563 1.1 mycroft oip->i_flag |= IN_CHANGE;
564 1.98 simonb UFS_WAPBL_UPDATE(ovp, NULL, NULL, 0);
565 1.105 bouyer #if defined(QUOTA) || defined(QUOTA2)
566 1.1 mycroft (void) chkdq(oip, -blocksreleased, NOCRED, 0);
567 1.1 mycroft #endif
568 1.55 fvdl KASSERT(ovp->v_type != VREG || ovp->v_size == oip->i_size);
569 1.1 mycroft return (allerror);
570 1.1 mycroft }
571 1.1 mycroft
572 1.1 mycroft /*
573 1.1 mycroft * Release blocks associated with the inode ip and stored in the indirect
574 1.1 mycroft * block bn. Blocks are free'd in LIFO order up to (but not including)
575 1.1 mycroft * lastbn. If level is greater than SINGLE, the block is an indirect block
576 1.1 mycroft * and recursive calls to indirtrunc must be used to cleanse other indirect
577 1.1 mycroft * blocks.
578 1.1 mycroft *
579 1.1 mycroft * NB: triple indirect blocks are untested.
580 1.1 mycroft */
581 1.1 mycroft static int
582 1.72 thorpej ffs_indirtrunc(struct inode *ip, daddr_t lbn, daddr_t dbn, daddr_t lastbn,
583 1.72 thorpej int level, int64_t *countp)
584 1.1 mycroft {
585 1.30 augustss int i;
586 1.1 mycroft struct buf *bp;
587 1.30 augustss struct fs *fs = ip->i_fs;
588 1.55 fvdl int32_t *bap1 = NULL;
589 1.55 fvdl int64_t *bap2 = NULL;
590 1.1 mycroft struct vnode *vp;
591 1.53 fvdl daddr_t nb, nlbn, last;
592 1.121 jdolecek char *copy = NULL;
593 1.118 jdolecek int64_t factor;
594 1.118 jdolecek int64_t nblocks;
595 1.121 jdolecek int error = 0, allerror = 0;
596 1.55 fvdl const int needswap = UFS_FSNEEDSWAP(fs);
597 1.121 jdolecek const int wapbl = (ip->i_ump->um_mountp->mnt_wapbl != NULL);
598 1.122 jdolecek void *dcookie;
599 1.118 jdolecek
600 1.55 fvdl #define RBAP(ip, i) (((ip)->i_ump->um_fstype == UFS1) ? \
601 1.55 fvdl ufs_rw32(bap1[i], needswap) : ufs_rw64(bap2[i], needswap))
602 1.57 kristerw #define BAP_ASSIGN(ip, i, value) \
603 1.57 kristerw do { \
604 1.57 kristerw if ((ip)->i_ump->um_fstype == UFS1) \
605 1.57 kristerw bap1[i] = (value); \
606 1.57 kristerw else \
607 1.57 kristerw bap2[i] = (value); \
608 1.57 kristerw } while(0)
609 1.1 mycroft
610 1.1 mycroft /*
611 1.1 mycroft * Calculate index in current block of last
612 1.1 mycroft * block to be kept. -1 indicates the entire
613 1.1 mycroft * block so we need not calculate the index.
614 1.1 mycroft */
615 1.1 mycroft factor = 1;
616 1.1 mycroft for (i = SINGLE; i < level; i++)
617 1.113 dholland factor *= FFS_NINDIR(fs);
618 1.1 mycroft last = lastbn;
619 1.1 mycroft if (lastbn > 0)
620 1.1 mycroft last /= factor;
621 1.1 mycroft nblocks = btodb(fs->fs_bsize);
622 1.1 mycroft /*
623 1.1 mycroft * Get buffer of block pointers, zero those entries corresponding
624 1.121 jdolecek * to blocks to be free'd, and update on disk copy first. Since
625 1.1 mycroft * double(triple) indirect before single(double) indirect, calls
626 1.1 mycroft * to bmap on these blocks will fail. However, we already have
627 1.1 mycroft * the on disk address, so we have to set the b_blkno field
628 1.1 mycroft * explicitly instead of letting bread do everything for us.
629 1.1 mycroft */
630 1.1 mycroft vp = ITOV(ip);
631 1.97 hannken error = ffs_getblk(vp, lbn, FFS_NOBLK, fs->fs_bsize, false, &bp);
632 1.118 jdolecek if (error)
633 1.97 hannken return error;
634 1.118 jdolecek
635 1.93 ad if (bp->b_oflags & (BO_DONE | BO_DELWRI)) {
636 1.1 mycroft /* Braces must be here in case trace evaluates to nothing. */
637 1.1 mycroft trace(TR_BREADHIT, pack(vp, fs->fs_bsize), lbn);
638 1.1 mycroft } else {
639 1.1 mycroft trace(TR_BREADMISS, pack(vp, fs->fs_bsize), lbn);
640 1.95 ad curlwp->l_ru.ru_inblock++; /* pay for read */
641 1.1 mycroft bp->b_flags |= B_READ;
642 1.97 hannken bp->b_flags &= ~B_COWDONE; /* we change blkno below */
643 1.1 mycroft if (bp->b_bcount > bp->b_bufsize)
644 1.1 mycroft panic("ffs_indirtrunc: bad buffer size");
645 1.1 mycroft bp->b_blkno = dbn;
646 1.61 yamt BIO_SETPRIO(bp, BPRIO_TIMECRITICAL);
647 1.62 hannken VOP_STRATEGY(vp, bp);
648 1.1 mycroft error = biowait(bp);
649 1.97 hannken if (error == 0)
650 1.97 hannken error = fscow_run(bp, true);
651 1.1 mycroft }
652 1.1 mycroft if (error) {
653 1.89 ad brelse(bp, 0);
654 1.118 jdolecek return error;
655 1.1 mycroft }
656 1.1 mycroft
657 1.121 jdolecek /*
658 1.121 jdolecek * Clear reference to blocks to be removed on disk, before actually
659 1.121 jdolecek * reclaiming them, so that fsck is more likely to be able to recover
660 1.121 jdolecek * the filesystem if system goes down during the truncate process.
661 1.121 jdolecek * This assumes the truncate process would not fail, contrary
662 1.121 jdolecek * to the wapbl case.
663 1.121 jdolecek */
664 1.123 hannken if (ip->i_ump->um_fstype == UFS1)
665 1.123 hannken bap1 = (int32_t *)bp->b_data;
666 1.123 hannken else
667 1.123 hannken bap2 = (int64_t *)bp->b_data;
668 1.121 jdolecek if (lastbn >= 0 && !wapbl) {
669 1.121 jdolecek copy = kmem_alloc(fs->fs_bsize, KM_SLEEP);
670 1.121 jdolecek memcpy((void *)copy, bp->b_data, (u_int)fs->fs_bsize);
671 1.121 jdolecek for (i = last + 1; i < FFS_NINDIR(fs); i++)
672 1.121 jdolecek BAP_ASSIGN(ip, i, 0);
673 1.121 jdolecek error = bwrite(bp);
674 1.121 jdolecek if (error)
675 1.121 jdolecek allerror = error;
676 1.121 jdolecek
677 1.121 jdolecek if (ip->i_ump->um_fstype == UFS1)
678 1.121 jdolecek bap1 = (int32_t *)copy;
679 1.121 jdolecek else
680 1.121 jdolecek bap2 = (int64_t *)copy;
681 1.121 jdolecek }
682 1.1 mycroft
683 1.1 mycroft /*
684 1.121 jdolecek * Recursively free totally unused blocks.
685 1.1 mycroft */
686 1.113 dholland for (i = FFS_NINDIR(fs) - 1, nlbn = lbn + 1 - i * factor; i > last;
687 1.1 mycroft i--, nlbn += factor) {
688 1.55 fvdl nb = RBAP(ip, i);
689 1.1 mycroft if (nb == 0)
690 1.1 mycroft continue;
691 1.118 jdolecek
692 1.122 jdolecek if ((ip->i_ump->um_mountp->mnt_wapbl) &&
693 1.122 jdolecek ((level > SINGLE) || (ITOV(ip)->v_type != VREG))) {
694 1.122 jdolecek error = UFS_WAPBL_REGISTER_DEALLOCATION(
695 1.122 jdolecek ip->i_ump->um_mountp,
696 1.122 jdolecek FFS_FSBTODB(fs, nb), fs->fs_bsize,
697 1.122 jdolecek &dcookie);
698 1.122 jdolecek if (error)
699 1.122 jdolecek goto out;
700 1.122 jdolecek } else {
701 1.122 jdolecek dcookie = NULL;
702 1.122 jdolecek }
703 1.122 jdolecek
704 1.1 mycroft if (level > SINGLE) {
705 1.114 dholland error = ffs_indirtrunc(ip, nlbn, FFS_FSBTODB(fs, nb),
706 1.118 jdolecek (daddr_t)-1, level - 1, countp);
707 1.122 jdolecek if (error) {
708 1.122 jdolecek if (dcookie) {
709 1.122 jdolecek UFS_WAPBL_UNREGISTER_DEALLOCATION(
710 1.122 jdolecek ip->i_ump->um_mountp, dcookie);
711 1.122 jdolecek }
712 1.122 jdolecek
713 1.118 jdolecek goto out;
714 1.122 jdolecek }
715 1.1 mycroft }
716 1.118 jdolecek
717 1.122 jdolecek if (!dcookie)
718 1.98 simonb ffs_blkfree(fs, ip->i_devvp, nb, fs->fs_bsize,
719 1.98 simonb ip->i_number);
720 1.118 jdolecek
721 1.118 jdolecek BAP_ASSIGN(ip, i, 0);
722 1.118 jdolecek *countp += nblocks;
723 1.1 mycroft }
724 1.1 mycroft
725 1.1 mycroft /*
726 1.118 jdolecek * Recursively free blocks on the now last partial indirect block.
727 1.1 mycroft */
728 1.1 mycroft if (level > SINGLE && lastbn >= 0) {
729 1.119 jdolecek last = lastbn % factor;
730 1.119 jdolecek nb = RBAP(ip, i);
731 1.1 mycroft if (nb != 0) {
732 1.114 dholland error = ffs_indirtrunc(ip, nlbn, FFS_FSBTODB(fs, nb),
733 1.119 jdolecek last, level - 1, countp);
734 1.9 christos if (error)
735 1.118 jdolecek goto out;
736 1.1 mycroft }
737 1.1 mycroft }
738 1.12 thorpej
739 1.118 jdolecek out:
740 1.121 jdolecek if (error && !allerror)
741 1.121 jdolecek allerror = error;
742 1.121 jdolecek
743 1.121 jdolecek if (copy != NULL) {
744 1.121 jdolecek kmem_free(copy, fs->fs_bsize);
745 1.121 jdolecek } else if (lastbn < 0 && error == 0) {
746 1.118 jdolecek /* all freed, release without writing back */
747 1.118 jdolecek brelse(bp, BC_INVAL);
748 1.121 jdolecek } else if (wapbl) {
749 1.121 jdolecek /* only partially freed, write the updated block */
750 1.121 jdolecek error = bwrite(bp);
751 1.121 jdolecek if (!allerror)
752 1.121 jdolecek allerror = error;
753 1.12 thorpej }
754 1.12 thorpej
755 1.121 jdolecek return (allerror);
756 1.1 mycroft }
757 1.74 drochner
758 1.74 drochner void
759 1.74 drochner ffs_itimes(struct inode *ip, const struct timespec *acc,
760 1.74 drochner const struct timespec *mod, const struct timespec *cre)
761 1.74 drochner {
762 1.82 kardel struct timespec now;
763 1.75 christos
764 1.76 yamt if (!(ip->i_flag & (IN_ACCESS | IN_CHANGE | IN_UPDATE | IN_MODIFY))) {
765 1.76 yamt return;
766 1.76 yamt }
767 1.75 christos
768 1.83 yamt vfs_timestamp(&now);
769 1.74 drochner if (ip->i_flag & IN_ACCESS) {
770 1.74 drochner if (acc == NULL)
771 1.82 kardel acc = &now;
772 1.74 drochner DIP_ASSIGN(ip, atime, acc->tv_sec);
773 1.74 drochner DIP_ASSIGN(ip, atimensec, acc->tv_nsec);
774 1.74 drochner }
775 1.74 drochner if (ip->i_flag & (IN_UPDATE | IN_MODIFY)) {
776 1.74 drochner if ((ip->i_flags & SF_SNAPSHOT) == 0) {
777 1.74 drochner if (mod == NULL)
778 1.82 kardel mod = &now;
779 1.74 drochner DIP_ASSIGN(ip, mtime, mod->tv_sec);
780 1.74 drochner DIP_ASSIGN(ip, mtimensec, mod->tv_nsec);
781 1.74 drochner }
782 1.74 drochner ip->i_modrev++;
783 1.74 drochner }
784 1.74 drochner if (ip->i_flag & (IN_CHANGE | IN_MODIFY)) {
785 1.74 drochner if (cre == NULL)
786 1.82 kardel cre = &now;
787 1.74 drochner DIP_ASSIGN(ip, ctime, cre->tv_sec);
788 1.74 drochner DIP_ASSIGN(ip, ctimensec, cre->tv_nsec);
789 1.74 drochner }
790 1.74 drochner if (ip->i_flag & (IN_ACCESS | IN_MODIFY))
791 1.74 drochner ip->i_flag |= IN_ACCESSED;
792 1.74 drochner if (ip->i_flag & (IN_UPDATE | IN_CHANGE))
793 1.74 drochner ip->i_flag |= IN_MODIFIED;
794 1.74 drochner ip->i_flag &= ~(IN_ACCESS | IN_CHANGE | IN_UPDATE | IN_MODIFY);
795 1.74 drochner }
796