ffs_balloc.c revision 1.13.2.1 1 1.13.2.1 chs /* $NetBSD: ffs_balloc.c,v 1.13.2.1 1998/11/09 06:06:35 chs Exp $ */
2 1.2 cgd
3 1.1 mycroft /*
4 1.1 mycroft * Copyright (c) 1982, 1986, 1989, 1993
5 1.1 mycroft * The Regents of the University of California. All rights reserved.
6 1.1 mycroft *
7 1.1 mycroft * Redistribution and use in source and binary forms, with or without
8 1.1 mycroft * modification, are permitted provided that the following conditions
9 1.1 mycroft * are met:
10 1.1 mycroft * 1. Redistributions of source code must retain the above copyright
11 1.1 mycroft * notice, this list of conditions and the following disclaimer.
12 1.1 mycroft * 2. Redistributions in binary form must reproduce the above copyright
13 1.1 mycroft * notice, this list of conditions and the following disclaimer in the
14 1.1 mycroft * documentation and/or other materials provided with the distribution.
15 1.1 mycroft * 3. All advertising materials mentioning features or use of this software
16 1.1 mycroft * must display the following acknowledgement:
17 1.1 mycroft * This product includes software developed by the University of
18 1.1 mycroft * California, Berkeley and its contributors.
19 1.1 mycroft * 4. Neither the name of the University nor the names of its contributors
20 1.1 mycroft * may be used to endorse or promote products derived from this software
21 1.1 mycroft * without specific prior written permission.
22 1.1 mycroft *
23 1.1 mycroft * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
24 1.1 mycroft * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
25 1.1 mycroft * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
26 1.1 mycroft * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
27 1.1 mycroft * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
28 1.1 mycroft * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
29 1.1 mycroft * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
30 1.1 mycroft * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
31 1.1 mycroft * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
32 1.1 mycroft * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
33 1.1 mycroft * SUCH DAMAGE.
34 1.1 mycroft *
35 1.8 fvdl * @(#)ffs_balloc.c 8.8 (Berkeley) 6/16/95
36 1.1 mycroft */
37 1.7 mrg
38 1.11 scottr #if defined(_KERNEL) && !defined(_LKM)
39 1.10 scottr #include "opt_quota.h"
40 1.7 mrg #include "opt_uvm.h"
41 1.11 scottr #endif
42 1.1 mycroft
43 1.1 mycroft #include <sys/param.h>
44 1.1 mycroft #include <sys/systm.h>
45 1.1 mycroft #include <sys/buf.h>
46 1.1 mycroft #include <sys/proc.h>
47 1.1 mycroft #include <sys/file.h>
48 1.1 mycroft #include <sys/vnode.h>
49 1.9 bouyer #include <sys/mount.h>
50 1.1 mycroft
51 1.1 mycroft #include <vm/vm.h>
52 1.1 mycroft
53 1.6 mrg #if defined(UVM)
54 1.13.2.1 chs #include <uvm/uvm.h>
55 1.6 mrg #endif
56 1.6 mrg
57 1.1 mycroft #include <ufs/ufs/quota.h>
58 1.9 bouyer #include <ufs/ufs/ufsmount.h>
59 1.1 mycroft #include <ufs/ufs/inode.h>
60 1.1 mycroft #include <ufs/ufs/ufs_extern.h>
61 1.9 bouyer #include <ufs/ufs/ufs_bswap.h>
62 1.1 mycroft
63 1.1 mycroft #include <ufs/ffs/fs.h>
64 1.1 mycroft #include <ufs/ffs/ffs_extern.h>
65 1.1 mycroft
66 1.1 mycroft /*
67 1.1 mycroft * Balloc defines the structure of file system storage
68 1.1 mycroft * by allocating the physical blocks on a device given
69 1.1 mycroft * the inode and the logical block number in a file.
70 1.1 mycroft */
71 1.3 christos int
72 1.8 fvdl ffs_balloc(ip, lbn, size, cred, bpp, flags)
73 1.1 mycroft register struct inode *ip;
74 1.8 fvdl register ufs_daddr_t lbn;
75 1.1 mycroft int size;
76 1.1 mycroft struct ucred *cred;
77 1.1 mycroft struct buf **bpp;
78 1.1 mycroft int flags;
79 1.1 mycroft {
80 1.1 mycroft register struct fs *fs;
81 1.8 fvdl register ufs_daddr_t nb;
82 1.1 mycroft struct buf *bp, *nbp;
83 1.1 mycroft struct vnode *vp = ITOV(ip);
84 1.1 mycroft struct indir indirs[NIADDR + 2];
85 1.8 fvdl ufs_daddr_t newb, *bap, pref;
86 1.8 fvdl int deallocated, osize, nsize, num, i, error;
87 1.8 fvdl ufs_daddr_t *allocib, *blkp, *allocblk, allociblk[NIADDR + 1];
88 1.1 mycroft
89 1.13.2.1 chs if (bpp != NULL) {
90 1.13.2.1 chs *bpp = NULL;
91 1.13.2.1 chs }
92 1.13.2.1 chs
93 1.8 fvdl if (lbn < 0)
94 1.1 mycroft return (EFBIG);
95 1.1 mycroft fs = ip->i_fs;
96 1.1 mycroft
97 1.1 mycroft /*
98 1.13.2.1 chs * If the file currently ends with a fragment and
99 1.13.2.1 chs * the block we're allocating now is after the current EOF,
100 1.1 mycroft * this fragment has to be extended to be a full block.
101 1.1 mycroft */
102 1.4 bouyer nb = lblkno(fs, ip->i_ffs_size);
103 1.8 fvdl if (nb < NDADDR && nb < lbn) {
104 1.1 mycroft osize = blksize(fs, ip, nb);
105 1.1 mycroft if (osize < fs->fs_bsize && osize > 0) {
106 1.1 mycroft error = ffs_realloccg(ip, nb,
107 1.4 bouyer ffs_blkpref(ip, nb, (int)nb, &ip->i_ffs_db[0]),
108 1.13.2.1 chs osize, (int)fs->fs_bsize, cred, bpp, &newb);
109 1.1 mycroft if (error)
110 1.1 mycroft return (error);
111 1.13.2.1 chs ip->i_ffs_size = lblktosize(fs, nb + 1);
112 1.6 mrg #if defined(UVM)
113 1.6 mrg uvm_vnp_setsize(vp, ip->i_ffs_size);
114 1.6 mrg #else
115 1.5 drochner vnode_pager_setsize(vp, ip->i_ffs_size);
116 1.6 mrg #endif
117 1.13.2.1 chs ip->i_ffs_db[nb] = ufs_rw32(newb,
118 1.12 kleink UFS_MPNEEDSWAP(vp->v_mount));
119 1.1 mycroft ip->i_flag |= IN_CHANGE | IN_UPDATE;
120 1.13.2.1 chs
121 1.13.2.1 chs if (bpp) {
122 1.13.2.1 chs if (flags & B_SYNC)
123 1.13.2.1 chs bwrite(*bpp);
124 1.13.2.1 chs else
125 1.13.2.1 chs bawrite(*bpp);
126 1.13.2.1 chs }
127 1.13.2.1 chs else {
128 1.13.2.1 chs /*
129 1.13.2.1 chs * XXX the data in the frag might be
130 1.13.2.1 chs * moving to a new disk location.
131 1.13.2.1 chs * we need to flush pages to the
132 1.13.2.1 chs * new disk locations.
133 1.13.2.1 chs * XXX we could do this in realloccg
134 1.13.2.1 chs * except for the sync flag.
135 1.13.2.1 chs */
136 1.13.2.1 chs (vp->v_uvm.u_obj.pgops->pgo_flush)
137 1.13.2.1 chs (&vp->v_uvm.u_obj, lblktosize(fs, nb),
138 1.13.2.1 chs lblktosize(fs, nb + 1),
139 1.13.2.1 chs flags & B_SYNC ? PGO_SYNCIO : 0);
140 1.13.2.1 chs }
141 1.1 mycroft }
142 1.1 mycroft }
143 1.1 mycroft /*
144 1.1 mycroft * The first NDADDR blocks are direct blocks
145 1.1 mycroft */
146 1.8 fvdl if (lbn < NDADDR) {
147 1.13.2.1 chs
148 1.9 bouyer nb = ufs_rw32(ip->i_ffs_db[lbn], UFS_MPNEEDSWAP(vp->v_mount));
149 1.13.2.1 chs if (nb != 0 && ip->i_ffs_size >= lblktosize(fs, lbn + 1)) {
150 1.13.2.1 chs
151 1.13.2.1 chs /*
152 1.13.2.1 chs * the block is an already-allocated direct block
153 1.13.2.1 chs * and the file already extends past this block,
154 1.13.2.1 chs * thus this must be a whole block.
155 1.13.2.1 chs * just read the block (if requested).
156 1.13.2.1 chs */
157 1.13.2.1 chs
158 1.13.2.1 chs justread:
159 1.13.2.1 chs if (bpp != NULL) {
160 1.13.2.1 chs error = bread(vp, lbn, fs->fs_bsize, NOCRED,
161 1.13.2.1 chs &bp);
162 1.13.2.1 chs if (error) {
163 1.13.2.1 chs brelse(bp);
164 1.13.2.1 chs return (error);
165 1.13.2.1 chs }
166 1.13.2.1 chs *bpp = bp;
167 1.1 mycroft }
168 1.1 mycroft return (0);
169 1.1 mycroft }
170 1.1 mycroft if (nb != 0) {
171 1.1 mycroft /*
172 1.1 mycroft * Consider need to reallocate a fragment.
173 1.1 mycroft */
174 1.4 bouyer osize = fragroundup(fs, blkoff(fs, ip->i_ffs_size));
175 1.1 mycroft nsize = fragroundup(fs, size);
176 1.1 mycroft if (nsize <= osize) {
177 1.13.2.1 chs
178 1.13.2.1 chs /*
179 1.13.2.1 chs * the existing block is already
180 1.13.2.1 chs * at least as big as we want.
181 1.13.2.1 chs * just read the block (if requested).
182 1.13.2.1 chs */
183 1.13.2.1 chs
184 1.13.2.1 chs goto justread;
185 1.1 mycroft } else {
186 1.13.2.1 chs
187 1.13.2.1 chs /*
188 1.13.2.1 chs * the existing block is smaller than we want,
189 1.13.2.1 chs * grow it.
190 1.13.2.1 chs */
191 1.13.2.1 chs
192 1.8 fvdl error = ffs_realloccg(ip, lbn,
193 1.8 fvdl ffs_blkpref(ip, lbn, (int)lbn,
194 1.8 fvdl &ip->i_ffs_db[0]), osize, nsize, cred,
195 1.13.2.1 chs bpp, &newb);
196 1.1 mycroft if (error)
197 1.1 mycroft return (error);
198 1.13.2.1 chs ip->i_ffs_db[lbn] = ufs_rw32(newb,
199 1.13.2.1 chs UFS_MPNEEDSWAP(vp->v_mount));
200 1.13.2.1 chs ip->i_flag |= IN_CHANGE | IN_UPDATE;
201 1.1 mycroft }
202 1.1 mycroft } else {
203 1.13.2.1 chs
204 1.13.2.1 chs /*
205 1.13.2.1 chs * the block was not previously allocated,
206 1.13.2.1 chs * allocate a new block or fragment.
207 1.13.2.1 chs */
208 1.13.2.1 chs
209 1.13.2.1 chs if (ip->i_ffs_size < lblktosize(fs, lbn + 1))
210 1.1 mycroft nsize = fragroundup(fs, size);
211 1.1 mycroft else
212 1.1 mycroft nsize = fs->fs_bsize;
213 1.8 fvdl error = ffs_alloc(ip, lbn,
214 1.8 fvdl ffs_blkpref(ip, lbn, (int)lbn, &ip->i_ffs_db[0]),
215 1.8 fvdl nsize, cred, &newb);
216 1.1 mycroft if (error)
217 1.1 mycroft return (error);
218 1.13.2.1 chs
219 1.13.2.1 chs ip->i_ffs_db[lbn] = ufs_rw32(newb,
220 1.13.2.1 chs UFS_MPNEEDSWAP(vp->v_mount));
221 1.13.2.1 chs ip->i_flag |= IN_CHANGE | IN_UPDATE;
222 1.13.2.1 chs
223 1.13.2.1 chs if (bpp != NULL) {
224 1.13.2.1 chs bp = getblk(vp, lbn, nsize, 0, 0);
225 1.13.2.1 chs bp->b_blkno = fsbtodb(fs, newb);
226 1.13.2.1 chs if (flags & B_CLRBUF)
227 1.13.2.1 chs clrbuf(bp);
228 1.13.2.1 chs *bpp = bp;
229 1.13.2.1 chs }
230 1.1 mycroft }
231 1.1 mycroft return (0);
232 1.1 mycroft }
233 1.1 mycroft /*
234 1.1 mycroft * Determine the number of levels of indirection.
235 1.1 mycroft */
236 1.1 mycroft pref = 0;
237 1.8 fvdl if ((error = ufs_getlbns(vp, lbn, indirs, &num)) != 0)
238 1.1 mycroft return(error);
239 1.1 mycroft #ifdef DIAGNOSTIC
240 1.1 mycroft if (num < 1)
241 1.1 mycroft panic ("ffs_balloc: ufs_bmaparray returned indirect block\n");
242 1.1 mycroft #endif
243 1.1 mycroft /*
244 1.1 mycroft * Fetch the first indirect block allocating if necessary.
245 1.1 mycroft */
246 1.1 mycroft --num;
247 1.9 bouyer nb = ufs_rw32(ip->i_ffs_ib[indirs[0].in_off],
248 1.12 kleink UFS_MPNEEDSWAP(vp->v_mount));
249 1.8 fvdl allocib = NULL;
250 1.8 fvdl allocblk = allociblk;
251 1.1 mycroft if (nb == 0) {
252 1.8 fvdl pref = ffs_blkpref(ip, lbn, 0, (ufs_daddr_t *)0);
253 1.9 bouyer error = ffs_alloc(ip, lbn, pref, (int)fs->fs_bsize,
254 1.9 bouyer cred, &newb);
255 1.3 christos if (error)
256 1.1 mycroft return (error);
257 1.1 mycroft nb = newb;
258 1.8 fvdl *allocblk++ = nb;
259 1.1 mycroft bp = getblk(vp, indirs[1].in_lbn, fs->fs_bsize, 0, 0);
260 1.8 fvdl bp->b_blkno = fsbtodb(fs, nb);
261 1.1 mycroft clrbuf(bp);
262 1.1 mycroft /*
263 1.1 mycroft * Write synchronously so that indirect blocks
264 1.1 mycroft * never point at garbage.
265 1.1 mycroft */
266 1.8 fvdl if ((error = bwrite(bp)) != 0)
267 1.8 fvdl goto fail;
268 1.8 fvdl allocib = &ip->i_ffs_ib[indirs[0].in_off];
269 1.9 bouyer *allocib = ufs_rw32(nb, UFS_MPNEEDSWAP(vp->v_mount));
270 1.1 mycroft ip->i_flag |= IN_CHANGE | IN_UPDATE;
271 1.1 mycroft }
272 1.1 mycroft /*
273 1.1 mycroft * Fetch through the indirect blocks, allocating as necessary.
274 1.1 mycroft */
275 1.1 mycroft for (i = 1;;) {
276 1.1 mycroft error = bread(vp,
277 1.1 mycroft indirs[i].in_lbn, (int)fs->fs_bsize, NOCRED, &bp);
278 1.1 mycroft if (error) {
279 1.1 mycroft brelse(bp);
280 1.8 fvdl goto fail;
281 1.1 mycroft }
282 1.8 fvdl bap = (ufs_daddr_t *)bp->b_data;
283 1.12 kleink nb = ufs_rw32(bap[indirs[i].in_off],
284 1.12 kleink UFS_MPNEEDSWAP(vp->v_mount));
285 1.1 mycroft if (i == num)
286 1.1 mycroft break;
287 1.1 mycroft i += 1;
288 1.1 mycroft if (nb != 0) {
289 1.1 mycroft brelse(bp);
290 1.1 mycroft continue;
291 1.1 mycroft }
292 1.1 mycroft if (pref == 0)
293 1.8 fvdl pref = ffs_blkpref(ip, lbn, 0, (ufs_daddr_t *)0);
294 1.3 christos error = ffs_alloc(ip, lbn, pref, (int)fs->fs_bsize, cred,
295 1.3 christos &newb);
296 1.3 christos if (error) {
297 1.1 mycroft brelse(bp);
298 1.8 fvdl goto fail;
299 1.1 mycroft }
300 1.1 mycroft nb = newb;
301 1.8 fvdl *allocblk++ = nb;
302 1.1 mycroft nbp = getblk(vp, indirs[i].in_lbn, fs->fs_bsize, 0, 0);
303 1.1 mycroft nbp->b_blkno = fsbtodb(fs, nb);
304 1.1 mycroft clrbuf(nbp);
305 1.1 mycroft /*
306 1.1 mycroft * Write synchronously so that indirect blocks
307 1.1 mycroft * never point at garbage.
308 1.1 mycroft */
309 1.3 christos if ((error = bwrite(nbp)) != 0) {
310 1.1 mycroft brelse(bp);
311 1.8 fvdl goto fail;
312 1.1 mycroft }
313 1.9 bouyer bap[indirs[i - 1].in_off] = ufs_rw32(nb,
314 1.12 kleink UFS_MPNEEDSWAP(vp->v_mount));
315 1.1 mycroft /*
316 1.1 mycroft * If required, write synchronously, otherwise use
317 1.1 mycroft * delayed write.
318 1.1 mycroft */
319 1.1 mycroft if (flags & B_SYNC) {
320 1.1 mycroft bwrite(bp);
321 1.1 mycroft } else {
322 1.1 mycroft bdwrite(bp);
323 1.1 mycroft }
324 1.1 mycroft }
325 1.1 mycroft /*
326 1.1 mycroft * Get the data block, allocating if necessary.
327 1.1 mycroft */
328 1.1 mycroft if (nb == 0) {
329 1.1 mycroft pref = ffs_blkpref(ip, lbn, indirs[i].in_off, &bap[0]);
330 1.3 christos error = ffs_alloc(ip, lbn, pref, (int)fs->fs_bsize, cred,
331 1.3 christos &newb);
332 1.3 christos if (error) {
333 1.1 mycroft brelse(bp);
334 1.8 fvdl goto fail;
335 1.1 mycroft }
336 1.1 mycroft nb = newb;
337 1.8 fvdl *allocblk++ = nb;
338 1.12 kleink bap[indirs[i].in_off] = ufs_rw32(nb,
339 1.12 kleink UFS_MPNEEDSWAP(vp->v_mount));
340 1.1 mycroft /*
341 1.1 mycroft * If required, write synchronously, otherwise use
342 1.1 mycroft * delayed write.
343 1.1 mycroft */
344 1.1 mycroft if (flags & B_SYNC) {
345 1.1 mycroft bwrite(bp);
346 1.1 mycroft } else {
347 1.1 mycroft bdwrite(bp);
348 1.1 mycroft }
349 1.13.2.1 chs if (bpp != NULL) {
350 1.13.2.1 chs nbp = getblk(vp, lbn, fs->fs_bsize, 0, 0);
351 1.13.2.1 chs nbp->b_blkno = fsbtodb(fs, nb);
352 1.13.2.1 chs if (flags & B_CLRBUF)
353 1.13.2.1 chs clrbuf(nbp);
354 1.13.2.1 chs *bpp = nbp;
355 1.13.2.1 chs }
356 1.1 mycroft return (0);
357 1.1 mycroft }
358 1.13.2.1 chs
359 1.1 mycroft brelse(bp);
360 1.13.2.1 chs
361 1.13.2.1 chs if (bpp != NULL) {
362 1.13.2.1 chs if (flags & B_CLRBUF) {
363 1.13.2.1 chs error = bread(vp, lbn, (int)fs->fs_bsize, NOCRED, &nbp);
364 1.13.2.1 chs if (error) {
365 1.13.2.1 chs brelse(nbp);
366 1.13.2.1 chs goto fail;
367 1.13.2.1 chs }
368 1.13.2.1 chs } else {
369 1.13.2.1 chs nbp = getblk(vp, lbn, fs->fs_bsize, 0, 0);
370 1.13.2.1 chs nbp->b_blkno = fsbtodb(fs, nb);
371 1.13.2.1 chs clrbuf(nbp);
372 1.1 mycroft }
373 1.13.2.1 chs *bpp = nbp;
374 1.1 mycroft }
375 1.13.2.1 chs
376 1.1 mycroft return (0);
377 1.8 fvdl fail:
378 1.8 fvdl /*
379 1.8 fvdl * If we have failed part way through block allocation, we
380 1.8 fvdl * have to deallocate any indirect blocks that we have allocated.
381 1.8 fvdl */
382 1.8 fvdl for (deallocated = 0, blkp = allociblk; blkp < allocblk; blkp++) {
383 1.8 fvdl ffs_blkfree(ip, *blkp, fs->fs_bsize);
384 1.8 fvdl deallocated += fs->fs_bsize;
385 1.8 fvdl }
386 1.8 fvdl if (allocib != NULL)
387 1.8 fvdl *allocib = 0;
388 1.8 fvdl if (deallocated) {
389 1.8 fvdl #ifdef QUOTA
390 1.8 fvdl /*
391 1.8 fvdl * Restore user's disk quota because allocation failed.
392 1.8 fvdl */
393 1.8 fvdl (void)chkdq(ip, (long)-btodb(deallocated), cred, FORCE);
394 1.8 fvdl #endif
395 1.8 fvdl ip->i_ffs_blocks -= btodb(deallocated);
396 1.13 mycroft ip->i_flag |= IN_CHANGE | IN_UPDATE;
397 1.8 fvdl }
398 1.8 fvdl return (error);
399 1.1 mycroft }
400