ext2fs_alloc.c revision 1.52 1 1.52 hannken /* $NetBSD: ext2fs_alloc.c,v 1.52 2017/05/28 16:38:55 hannken Exp $ */
2 1.1 bouyer
3 1.1 bouyer /*
4 1.1 bouyer * Copyright (c) 1982, 1986, 1989, 1993
5 1.1 bouyer * The Regents of the University of California. All rights reserved.
6 1.1 bouyer *
7 1.1 bouyer * Redistribution and use in source and binary forms, with or without
8 1.1 bouyer * modification, are permitted provided that the following conditions
9 1.1 bouyer * are met:
10 1.1 bouyer * 1. Redistributions of source code must retain the above copyright
11 1.1 bouyer * notice, this list of conditions and the following disclaimer.
12 1.1 bouyer * 2. Redistributions in binary form must reproduce the above copyright
13 1.1 bouyer * notice, this list of conditions and the following disclaimer in the
14 1.1 bouyer * documentation and/or other materials provided with the distribution.
15 1.20 agc * 3. Neither the name of the University nor the names of its contributors
16 1.20 agc * may be used to endorse or promote products derived from this software
17 1.20 agc * without specific prior written permission.
18 1.20 agc *
19 1.20 agc * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
20 1.20 agc * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
21 1.20 agc * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
22 1.20 agc * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
23 1.20 agc * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
24 1.20 agc * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
25 1.20 agc * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
26 1.20 agc * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
27 1.20 agc * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
28 1.20 agc * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29 1.20 agc * SUCH DAMAGE.
30 1.20 agc *
31 1.20 agc * @(#)ffs_alloc.c 8.11 (Berkeley) 10/27/94
32 1.20 agc * Modified for ext2fs by Manuel Bouyer.
33 1.20 agc */
34 1.20 agc
35 1.20 agc /*
36 1.20 agc * Copyright (c) 1997 Manuel Bouyer.
37 1.20 agc *
38 1.20 agc * Redistribution and use in source and binary forms, with or without
39 1.20 agc * modification, are permitted provided that the following conditions
40 1.20 agc * are met:
41 1.20 agc * 1. Redistributions of source code must retain the above copyright
42 1.20 agc * notice, this list of conditions and the following disclaimer.
43 1.20 agc * 2. Redistributions in binary form must reproduce the above copyright
44 1.20 agc * notice, this list of conditions and the following disclaimer in the
45 1.20 agc * documentation and/or other materials provided with the distribution.
46 1.1 bouyer *
47 1.22 bouyer * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
48 1.22 bouyer * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
49 1.22 bouyer * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
50 1.22 bouyer * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
51 1.22 bouyer * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
52 1.22 bouyer * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
53 1.22 bouyer * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
54 1.22 bouyer * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
55 1.22 bouyer * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
56 1.22 bouyer * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
57 1.1 bouyer *
58 1.1 bouyer * @(#)ffs_alloc.c 8.11 (Berkeley) 10/27/94
59 1.1 bouyer * Modified for ext2fs by Manuel Bouyer.
60 1.1 bouyer */
61 1.13 lukem
62 1.13 lukem #include <sys/cdefs.h>
63 1.52 hannken __KERNEL_RCSID(0, "$NetBSD: ext2fs_alloc.c,v 1.52 2017/05/28 16:38:55 hannken Exp $");
64 1.1 bouyer
65 1.1 bouyer #include <sys/param.h>
66 1.1 bouyer #include <sys/systm.h>
67 1.1 bouyer #include <sys/buf.h>
68 1.1 bouyer #include <sys/proc.h>
69 1.1 bouyer #include <sys/vnode.h>
70 1.1 bouyer #include <sys/mount.h>
71 1.1 bouyer #include <sys/kernel.h>
72 1.1 bouyer #include <sys/syslog.h>
73 1.29 elad #include <sys/kauth.h>
74 1.1 bouyer
75 1.49 jdolecek #include <lib/libkern/crc16.h>
76 1.49 jdolecek
77 1.1 bouyer #include <ufs/ufs/inode.h>
78 1.1 bouyer #include <ufs/ufs/ufs_extern.h>
79 1.27 yamt #include <ufs/ufs/ufsmount.h>
80 1.1 bouyer
81 1.1 bouyer #include <ufs/ext2fs/ext2fs.h>
82 1.1 bouyer #include <ufs/ext2fs/ext2fs_extern.h>
83 1.1 bouyer
84 1.1 bouyer u_long ext2gennumber;
85 1.1 bouyer
86 1.26 xtraeme static daddr_t ext2fs_alloccg(struct inode *, int, daddr_t, int);
87 1.26 xtraeme static u_long ext2fs_dirpref(struct m_ext2fs *);
88 1.26 xtraeme static void ext2fs_fserr(struct m_ext2fs *, u_int, const char *);
89 1.26 xtraeme static u_long ext2fs_hashalloc(struct inode *, int, long, int,
90 1.40 tsutsui daddr_t (*)(struct inode *, int, daddr_t, int));
91 1.26 xtraeme static daddr_t ext2fs_nodealloccg(struct inode *, int, daddr_t, int);
92 1.26 xtraeme static daddr_t ext2fs_mapsearch(struct m_ext2fs *, char *, daddr_t);
93 1.49 jdolecek static __inline void ext2fs_cg_update(struct m_ext2fs *, int, struct ext2_gd *, int, int, int, daddr_t);
94 1.49 jdolecek static uint16_t ext2fs_cg_get_csum(struct m_ext2fs *, int, struct ext2_gd *);
95 1.49 jdolecek static void ext2fs_init_bb(struct m_ext2fs *, int, struct ext2_gd *, char *);
96 1.1 bouyer
97 1.1 bouyer /*
98 1.1 bouyer * Allocate a block in the file system.
99 1.23 perry *
100 1.1 bouyer * A preference may be optionally specified. If a preference is given
101 1.1 bouyer * the following hierarchy is used to allocate a block:
102 1.1 bouyer * 1) allocate the requested block.
103 1.1 bouyer * 2) allocate a rotationally optimal block in the same cylinder.
104 1.1 bouyer * 3) allocate a block in the same cylinder group.
105 1.1 bouyer * 4) quadradically rehash into other cylinder groups, until an
106 1.1 bouyer * available block is located.
107 1.11 wiz * If no block preference is given the following hierarchy is used
108 1.1 bouyer * to allocate a block:
109 1.1 bouyer * 1) allocate a block in the cylinder group that contains the
110 1.1 bouyer * inode for the file.
111 1.1 bouyer * 2) quadradically rehash into other cylinder groups, until an
112 1.1 bouyer * available block is located.
113 1.1 bouyer */
114 1.1 bouyer int
115 1.32 christos ext2fs_alloc(struct inode *ip, daddr_t lbn, daddr_t bpref,
116 1.31 christos kauth_cred_t cred, daddr_t *bnp)
117 1.1 bouyer {
118 1.7 augustss struct m_ext2fs *fs;
119 1.15 fvdl daddr_t bno;
120 1.1 bouyer int cg;
121 1.23 perry
122 1.1 bouyer *bnp = 0;
123 1.1 bouyer fs = ip->i_e2fs;
124 1.1 bouyer #ifdef DIAGNOSTIC
125 1.1 bouyer if (cred == NOCRED)
126 1.14 provos panic("ext2fs_alloc: missing credential");
127 1.1 bouyer #endif /* DIAGNOSTIC */
128 1.1 bouyer if (fs->e2fs.e2fs_fbcount == 0)
129 1.1 bouyer goto nospace;
130 1.39 elad if (kauth_authorize_system(cred, KAUTH_SYSTEM_FS_RESERVEDSPACE, 0, NULL,
131 1.39 elad NULL, NULL) != 0 &&
132 1.34 elad freespace(fs) <= 0)
133 1.1 bouyer goto nospace;
134 1.1 bouyer if (bpref >= fs->e2fs.e2fs_bcount)
135 1.1 bouyer bpref = 0;
136 1.1 bouyer if (bpref == 0)
137 1.1 bouyer cg = ino_to_cg(fs, ip->i_number);
138 1.1 bouyer else
139 1.1 bouyer cg = dtog(fs, bpref);
140 1.15 fvdl bno = (daddr_t)ext2fs_hashalloc(ip, cg, bpref, fs->e2fs_bsize,
141 1.40 tsutsui ext2fs_alloccg);
142 1.1 bouyer if (bno > 0) {
143 1.43 jakllsch ext2fs_setnblock(ip, ext2fs_nblock(ip) + btodb(fs->e2fs_bsize));
144 1.1 bouyer ip->i_flag |= IN_CHANGE | IN_UPDATE;
145 1.1 bouyer *bnp = bno;
146 1.48 christos return 0;
147 1.1 bouyer }
148 1.1 bouyer nospace:
149 1.29 elad ext2fs_fserr(fs, kauth_cred_geteuid(cred), "file system full");
150 1.1 bouyer uprintf("\n%s: write failed, file system is full\n", fs->e2fs_fsmnt);
151 1.48 christos return ENOSPC;
152 1.1 bouyer }
153 1.1 bouyer
154 1.1 bouyer /*
155 1.1 bouyer * Allocate an inode in the file system.
156 1.23 perry *
157 1.1 bouyer * If allocating a directory, use ext2fs_dirpref to select the inode.
158 1.1 bouyer * If allocating in a directory, the following hierarchy is followed:
159 1.1 bouyer * 1) allocate the preferred inode.
160 1.1 bouyer * 2) allocate an inode in the same cylinder group.
161 1.1 bouyer * 3) quadradically rehash into other cylinder groups, until an
162 1.1 bouyer * available inode is located.
163 1.11 wiz * If no inode preference is given the following hierarchy is used
164 1.1 bouyer * to allocate an inode:
165 1.1 bouyer * 1) allocate an inode in cylinder group 0.
166 1.1 bouyer * 2) quadradically rehash into other cylinder groups, until an
167 1.1 bouyer * available inode is located.
168 1.1 bouyer */
169 1.1 bouyer int
170 1.52 hannken ext2fs_valloc(struct vnode *pvp, int mode, kauth_cred_t cred, ino_t *inop)
171 1.1 bouyer {
172 1.7 augustss struct inode *pip;
173 1.7 augustss struct m_ext2fs *fs;
174 1.1 bouyer ino_t ino, ipref;
175 1.52 hannken int cg;
176 1.23 perry
177 1.1 bouyer pip = VTOI(pvp);
178 1.1 bouyer fs = pip->i_e2fs;
179 1.1 bouyer if (fs->e2fs.e2fs_ficount == 0)
180 1.1 bouyer goto noinodes;
181 1.1 bouyer
182 1.1 bouyer if ((mode & IFMT) == IFDIR)
183 1.1 bouyer cg = ext2fs_dirpref(fs);
184 1.1 bouyer else
185 1.1 bouyer cg = ino_to_cg(fs, pip->i_number);
186 1.1 bouyer ipref = cg * fs->e2fs.e2fs_ipg + 1;
187 1.1 bouyer ino = (ino_t)ext2fs_hashalloc(pip, cg, (long)ipref, mode, ext2fs_nodealloccg);
188 1.1 bouyer if (ino == 0)
189 1.1 bouyer goto noinodes;
190 1.49 jdolecek
191 1.52 hannken *inop = ino;
192 1.52 hannken return 0;
193 1.1 bouyer
194 1.1 bouyer noinodes:
195 1.29 elad ext2fs_fserr(fs, kauth_cred_geteuid(cred), "out of inodes");
196 1.1 bouyer uprintf("\n%s: create/symlink failed, no inodes free\n", fs->e2fs_fsmnt);
197 1.48 christos return ENOSPC;
198 1.1 bouyer }
199 1.1 bouyer
200 1.1 bouyer /*
201 1.1 bouyer * Find a cylinder to place a directory.
202 1.1 bouyer *
203 1.1 bouyer * The policy implemented by this algorithm is to select from
204 1.1 bouyer * among those cylinder groups with above the average number of
205 1.1 bouyer * free inodes, the one with the smallest number of directories.
206 1.1 bouyer */
207 1.1 bouyer static u_long
208 1.26 xtraeme ext2fs_dirpref(struct m_ext2fs *fs)
209 1.1 bouyer {
210 1.1 bouyer int cg, maxspace, mincg, avgifree;
211 1.1 bouyer
212 1.1 bouyer avgifree = fs->e2fs.e2fs_ficount / fs->e2fs_ncg;
213 1.1 bouyer maxspace = 0;
214 1.1 bouyer mincg = -1;
215 1.1 bouyer for (cg = 0; cg < fs->e2fs_ncg; cg++)
216 1.49 jdolecek if (fs2h16(fs->e2fs_gd[cg].ext2bgd_nifree) >= avgifree) {
217 1.49 jdolecek if (mincg == -1 || fs2h16(fs->e2fs_gd[cg].ext2bgd_nbfree) > maxspace) {
218 1.1 bouyer mincg = cg;
219 1.49 jdolecek maxspace = fs2h16(fs->e2fs_gd[cg].ext2bgd_nbfree);
220 1.1 bouyer }
221 1.1 bouyer }
222 1.1 bouyer return mincg;
223 1.1 bouyer }
224 1.1 bouyer
225 1.1 bouyer /*
226 1.1 bouyer * Select the desired position for the next block in a file. The file is
227 1.1 bouyer * logically divided into sections. The first section is composed of the
228 1.1 bouyer * direct blocks. Each additional section contains fs_maxbpg blocks.
229 1.23 perry *
230 1.1 bouyer * If no blocks have been allocated in the first section, the policy is to
231 1.1 bouyer * request a block in the same cylinder group as the inode that describes
232 1.1 bouyer * the file. Otherwise, the policy is to try to allocate the blocks
233 1.10 toshii * contigously. The two fields of the ext2 inode extension (see
234 1.1 bouyer * ufs/ufs/inode.h) help this.
235 1.1 bouyer */
236 1.15 fvdl daddr_t
237 1.26 xtraeme ext2fs_blkpref(struct inode *ip, daddr_t lbn, int indx,
238 1.26 xtraeme int32_t *bap /* XXX ondisk32 */)
239 1.1 bouyer {
240 1.7 augustss struct m_ext2fs *fs;
241 1.7 augustss int cg, i;
242 1.1 bouyer
243 1.1 bouyer fs = ip->i_e2fs;
244 1.1 bouyer /*
245 1.1 bouyer * if we are doing contigous lbn allocation, try to alloc blocks
246 1.1 bouyer * contigously on disk
247 1.1 bouyer */
248 1.1 bouyer
249 1.1 bouyer if ( ip->i_e2fs_last_blk && lbn == ip->i_e2fs_last_lblk + 1) {
250 1.1 bouyer return ip->i_e2fs_last_blk + 1;
251 1.1 bouyer }
252 1.1 bouyer
253 1.1 bouyer /*
254 1.1 bouyer * bap, if provided, gives us a list of blocks to which we want to
255 1.1 bouyer * stay close
256 1.1 bouyer */
257 1.1 bouyer
258 1.1 bouyer if (bap) {
259 1.1 bouyer for (i = indx; i >= 0 ; i--) {
260 1.1 bouyer if (bap[i]) {
261 1.2 bouyer return fs2h32(bap[i]) + 1;
262 1.1 bouyer }
263 1.1 bouyer }
264 1.1 bouyer }
265 1.1 bouyer
266 1.1 bouyer /* fall back to the first block of the cylinder containing the inode */
267 1.1 bouyer
268 1.1 bouyer cg = ino_to_cg(fs, ip->i_number);
269 1.1 bouyer return fs->e2fs.e2fs_bpg * cg + fs->e2fs.e2fs_first_dblock + 1;
270 1.1 bouyer }
271 1.1 bouyer
272 1.1 bouyer /*
273 1.1 bouyer * Implement the cylinder overflow algorithm.
274 1.1 bouyer *
275 1.1 bouyer * The policy implemented by this algorithm is:
276 1.1 bouyer * 1) allocate the block in its requested cylinder group.
277 1.1 bouyer * 2) quadradically rehash on the cylinder group number.
278 1.1 bouyer * 3) brute force search for a free block.
279 1.1 bouyer */
280 1.1 bouyer static u_long
281 1.26 xtraeme ext2fs_hashalloc(struct inode *ip, int cg, long pref, int size,
282 1.26 xtraeme daddr_t (*allocator)(struct inode *, int, daddr_t, int))
283 1.1 bouyer {
284 1.7 augustss struct m_ext2fs *fs;
285 1.1 bouyer long result;
286 1.1 bouyer int i, icg = cg;
287 1.1 bouyer
288 1.1 bouyer fs = ip->i_e2fs;
289 1.1 bouyer /*
290 1.1 bouyer * 1: preferred cylinder group
291 1.1 bouyer */
292 1.1 bouyer result = (*allocator)(ip, cg, pref, size);
293 1.1 bouyer if (result)
294 1.48 christos return result;
295 1.1 bouyer /*
296 1.1 bouyer * 2: quadratic rehash
297 1.1 bouyer */
298 1.1 bouyer for (i = 1; i < fs->e2fs_ncg; i *= 2) {
299 1.1 bouyer cg += i;
300 1.1 bouyer if (cg >= fs->e2fs_ncg)
301 1.1 bouyer cg -= fs->e2fs_ncg;
302 1.1 bouyer result = (*allocator)(ip, cg, 0, size);
303 1.1 bouyer if (result)
304 1.48 christos return result;
305 1.1 bouyer }
306 1.1 bouyer /*
307 1.1 bouyer * 3: brute force search
308 1.1 bouyer * Note that we start at i == 2, since 0 was checked initially,
309 1.1 bouyer * and 1 is always checked in the quadratic rehash.
310 1.1 bouyer */
311 1.1 bouyer cg = (icg + 2) % fs->e2fs_ncg;
312 1.1 bouyer for (i = 2; i < fs->e2fs_ncg; i++) {
313 1.1 bouyer result = (*allocator)(ip, cg, 0, size);
314 1.1 bouyer if (result)
315 1.48 christos return result;
316 1.1 bouyer cg++;
317 1.1 bouyer if (cg == fs->e2fs_ncg)
318 1.1 bouyer cg = 0;
319 1.1 bouyer }
320 1.48 christos return 0;
321 1.1 bouyer }
322 1.1 bouyer
323 1.1 bouyer /*
324 1.1 bouyer * Determine whether a block can be allocated.
325 1.1 bouyer *
326 1.1 bouyer * Check to see if a block of the appropriate size is available,
327 1.1 bouyer * and if it is, allocate it.
328 1.1 bouyer */
329 1.1 bouyer
330 1.15 fvdl static daddr_t
331 1.32 christos ext2fs_alloccg(struct inode *ip, int cg, daddr_t bpref, int size)
332 1.1 bouyer {
333 1.7 augustss struct m_ext2fs *fs;
334 1.7 augustss char *bbp;
335 1.1 bouyer struct buf *bp;
336 1.15 fvdl /* XXX ondisk32 */
337 1.1 bouyer int error, bno, start, end, loc;
338 1.1 bouyer
339 1.1 bouyer fs = ip->i_e2fs;
340 1.1 bouyer if (fs->e2fs_gd[cg].ext2bgd_nbfree == 0)
341 1.48 christos return 0;
342 1.45 dholland error = bread(ip->i_devvp, EXT2_FSBTODB(fs,
343 1.49 jdolecek fs2h32(fs->e2fs_gd[cg].ext2bgd_b_bitmap)),
344 1.46 maxv (int)fs->e2fs_bsize, B_MODIFY, &bp);
345 1.1 bouyer if (error) {
346 1.48 christos return 0;
347 1.1 bouyer }
348 1.1 bouyer bbp = (char *)bp->b_data;
349 1.1 bouyer
350 1.1 bouyer if (dtog(fs, bpref) != cg)
351 1.1 bouyer bpref = 0;
352 1.49 jdolecek
353 1.49 jdolecek /* initialize block bitmap now if uninit */
354 1.49 jdolecek if (__predict_false(E2FS_HAS_GD_CSUM(fs) &&
355 1.49 jdolecek (fs->e2fs_gd[cg].ext2bgd_flags & h2fs16(E2FS_BG_BLOCK_UNINIT)))) {
356 1.49 jdolecek ext2fs_init_bb(fs, cg, &fs->e2fs_gd[cg], bbp);
357 1.49 jdolecek fs->e2fs_gd[cg].ext2bgd_flags &= h2fs16(~E2FS_BG_BLOCK_UNINIT);
358 1.49 jdolecek }
359 1.49 jdolecek
360 1.1 bouyer if (bpref != 0) {
361 1.1 bouyer bpref = dtogd(fs, bpref);
362 1.1 bouyer /*
363 1.1 bouyer * if the requested block is available, use it
364 1.1 bouyer */
365 1.1 bouyer if (isclr(bbp, bpref)) {
366 1.1 bouyer bno = bpref;
367 1.1 bouyer goto gotit;
368 1.1 bouyer }
369 1.1 bouyer }
370 1.1 bouyer /*
371 1.1 bouyer * no blocks in the requested cylinder, so take next
372 1.1 bouyer * available one in this cylinder group.
373 1.1 bouyer * first try to get 8 contigous blocks, then fall back to a single
374 1.1 bouyer * block.
375 1.1 bouyer */
376 1.1 bouyer if (bpref)
377 1.1 bouyer start = dtogd(fs, bpref) / NBBY;
378 1.1 bouyer else
379 1.1 bouyer start = 0;
380 1.1 bouyer end = howmany(fs->e2fs.e2fs_fpg, NBBY) - start;
381 1.1 bouyer for (loc = start; loc < end; loc++) {
382 1.1 bouyer if (bbp[loc] == 0) {
383 1.1 bouyer bno = loc * NBBY;
384 1.1 bouyer goto gotit;
385 1.1 bouyer }
386 1.1 bouyer }
387 1.1 bouyer for (loc = 0; loc < start; loc++) {
388 1.1 bouyer if (bbp[loc] == 0) {
389 1.1 bouyer bno = loc * NBBY;
390 1.1 bouyer goto gotit;
391 1.1 bouyer }
392 1.1 bouyer }
393 1.1 bouyer
394 1.1 bouyer bno = ext2fs_mapsearch(fs, bbp, bpref);
395 1.50 jdolecek #if 0
396 1.51 jdolecek /*
397 1.51 jdolecek * XXX jdolecek mapsearch actually never fails, it panics instead.
398 1.51 jdolecek * If re-enabling, make sure to brele() before returning.
399 1.51 jdolecek */
400 1.1 bouyer if (bno < 0)
401 1.48 christos return 0;
402 1.50 jdolecek #endif
403 1.1 bouyer gotit:
404 1.1 bouyer #ifdef DIAGNOSTIC
405 1.15 fvdl if (isset(bbp, (daddr_t)bno)) {
406 1.1 bouyer printf("ext2fs_alloccgblk: cg=%d bno=%d fs=%s\n",
407 1.1 bouyer cg, bno, fs->e2fs_fsmnt);
408 1.2 bouyer panic("ext2fs_alloccg: dup alloc");
409 1.1 bouyer }
410 1.1 bouyer #endif
411 1.15 fvdl setbit(bbp, (daddr_t)bno);
412 1.1 bouyer fs->e2fs.e2fs_fbcount--;
413 1.49 jdolecek ext2fs_cg_update(fs, cg, &fs->e2fs_gd[cg], -1, 0, 0, 0);
414 1.1 bouyer fs->e2fs_fmod = 1;
415 1.1 bouyer bdwrite(bp);
416 1.48 christos return cg * fs->e2fs.e2fs_fpg + fs->e2fs.e2fs_first_dblock + bno;
417 1.1 bouyer }
418 1.1 bouyer
419 1.1 bouyer /*
420 1.1 bouyer * Determine whether an inode can be allocated.
421 1.1 bouyer *
422 1.1 bouyer * Check to see if an inode is available, and if it is,
423 1.1 bouyer * allocate it using the following policy:
424 1.1 bouyer * 1) allocate the requested inode.
425 1.1 bouyer * 2) allocate the next available inode after the requested
426 1.1 bouyer * inode in the specified cylinder group.
427 1.1 bouyer */
428 1.15 fvdl static daddr_t
429 1.26 xtraeme ext2fs_nodealloccg(struct inode *ip, int cg, daddr_t ipref, int mode)
430 1.1 bouyer {
431 1.7 augustss struct m_ext2fs *fs;
432 1.7 augustss char *ibp;
433 1.1 bouyer struct buf *bp;
434 1.1 bouyer int error, start, len, loc, map, i;
435 1.1 bouyer
436 1.1 bouyer ipref--; /* to avoid a lot of (ipref -1) */
437 1.33 chs if (ipref == -1)
438 1.33 chs ipref = 0;
439 1.1 bouyer fs = ip->i_e2fs;
440 1.1 bouyer if (fs->e2fs_gd[cg].ext2bgd_nifree == 0)
441 1.48 christos return 0;
442 1.45 dholland error = bread(ip->i_devvp, EXT2_FSBTODB(fs,
443 1.49 jdolecek fs2h32(fs->e2fs_gd[cg].ext2bgd_i_bitmap)),
444 1.46 maxv (int)fs->e2fs_bsize, B_MODIFY, &bp);
445 1.1 bouyer if (error) {
446 1.48 christos return 0;
447 1.1 bouyer }
448 1.1 bouyer ibp = (char *)bp->b_data;
449 1.49 jdolecek
450 1.49 jdolecek KASSERT(!E2FS_HAS_GD_CSUM(fs) || (fs->e2fs_gd[cg].ext2bgd_flags & h2fs16(E2FS_BG_INODE_ZEROED)) != 0);
451 1.49 jdolecek
452 1.49 jdolecek /* initialize inode bitmap now if uninit */
453 1.49 jdolecek if (__predict_false(E2FS_HAS_GD_CSUM(fs) &&
454 1.49 jdolecek (fs->e2fs_gd[cg].ext2bgd_flags & h2fs16(E2FS_BG_INODE_UNINIT)))) {
455 1.49 jdolecek KASSERT(fs2h16(fs->e2fs_gd[cg].ext2bgd_nifree) == fs->e2fs.e2fs_ipg);
456 1.49 jdolecek memset(ibp, 0, fs->e2fs_bsize);
457 1.49 jdolecek fs->e2fs_gd[cg].ext2bgd_flags &= h2fs16(~E2FS_BG_INODE_UNINIT);
458 1.49 jdolecek }
459 1.49 jdolecek
460 1.1 bouyer if (ipref) {
461 1.1 bouyer ipref %= fs->e2fs.e2fs_ipg;
462 1.1 bouyer if (isclr(ibp, ipref))
463 1.1 bouyer goto gotit;
464 1.1 bouyer }
465 1.1 bouyer start = ipref / NBBY;
466 1.1 bouyer len = howmany(fs->e2fs.e2fs_ipg - ipref, NBBY);
467 1.1 bouyer loc = skpc(0xff, len, &ibp[start]);
468 1.1 bouyer if (loc == 0) {
469 1.1 bouyer len = start + 1;
470 1.1 bouyer start = 0;
471 1.1 bouyer loc = skpc(0xff, len, &ibp[0]);
472 1.1 bouyer if (loc == 0) {
473 1.15 fvdl printf("cg = %d, ipref = %lld, fs = %s\n",
474 1.15 fvdl cg, (long long)ipref, fs->e2fs_fsmnt);
475 1.1 bouyer panic("ext2fs_nodealloccg: map corrupted");
476 1.1 bouyer /* NOTREACHED */
477 1.1 bouyer }
478 1.1 bouyer }
479 1.1 bouyer i = start + len - loc;
480 1.42 rmind map = ibp[i] ^ 0xff;
481 1.42 rmind if (map == 0) {
482 1.42 rmind printf("fs = %s\n", fs->e2fs_fsmnt);
483 1.49 jdolecek panic("ext2fs_nodealloccg: inode not in map");
484 1.1 bouyer }
485 1.42 rmind ipref = i * NBBY + ffs(map) - 1;
486 1.1 bouyer gotit:
487 1.1 bouyer setbit(ibp, ipref);
488 1.1 bouyer fs->e2fs.e2fs_ficount--;
489 1.49 jdolecek ext2fs_cg_update(fs, cg, &fs->e2fs_gd[cg],
490 1.49 jdolecek 0, -1, ((mode & IFMT) == IFDIR) ? 1 : 0, ipref);
491 1.1 bouyer fs->e2fs_fmod = 1;
492 1.1 bouyer bdwrite(bp);
493 1.48 christos return cg * fs->e2fs.e2fs_ipg + ipref + 1;
494 1.1 bouyer }
495 1.1 bouyer
496 1.1 bouyer /*
497 1.1 bouyer * Free a block.
498 1.1 bouyer *
499 1.1 bouyer * The specified block is placed back in the
500 1.1 bouyer * free map.
501 1.1 bouyer */
502 1.1 bouyer void
503 1.26 xtraeme ext2fs_blkfree(struct inode *ip, daddr_t bno)
504 1.1 bouyer {
505 1.7 augustss struct m_ext2fs *fs;
506 1.7 augustss char *bbp;
507 1.1 bouyer struct buf *bp;
508 1.1 bouyer int error, cg;
509 1.1 bouyer
510 1.1 bouyer fs = ip->i_e2fs;
511 1.1 bouyer cg = dtog(fs, bno);
512 1.49 jdolecek
513 1.49 jdolecek KASSERT(!E2FS_HAS_GD_CSUM(fs) || (fs->e2fs_gd[cg].ext2bgd_flags & h2fs16(E2FS_BG_BLOCK_UNINIT)) == 0);
514 1.49 jdolecek
515 1.1 bouyer if ((u_int)bno >= fs->e2fs.e2fs_bcount) {
516 1.25 christos printf("bad block %lld, ino %llu\n", (long long)bno,
517 1.25 christos (unsigned long long)ip->i_number);
518 1.37 mrg ext2fs_fserr(fs, ip->i_uid, "bad block");
519 1.1 bouyer return;
520 1.1 bouyer }
521 1.6 bouyer error = bread(ip->i_devvp,
522 1.49 jdolecek EXT2_FSBTODB(fs, fs2h32(fs->e2fs_gd[cg].ext2bgd_b_bitmap)),
523 1.46 maxv (int)fs->e2fs_bsize, B_MODIFY, &bp);
524 1.1 bouyer if (error) {
525 1.1 bouyer return;
526 1.1 bouyer }
527 1.1 bouyer bbp = (char *)bp->b_data;
528 1.1 bouyer bno = dtogd(fs, bno);
529 1.1 bouyer if (isclr(bbp, bno)) {
530 1.38 christos printf("dev = 0x%llx, block = %lld, fs = %s\n",
531 1.38 christos (unsigned long long)ip->i_dev, (long long)bno,
532 1.38 christos fs->e2fs_fsmnt);
533 1.1 bouyer panic("blkfree: freeing free block");
534 1.1 bouyer }
535 1.1 bouyer clrbit(bbp, bno);
536 1.1 bouyer fs->e2fs.e2fs_fbcount++;
537 1.49 jdolecek ext2fs_cg_update(fs, cg, &fs->e2fs_gd[cg], 1, 0, 0, 0);
538 1.1 bouyer fs->e2fs_fmod = 1;
539 1.1 bouyer bdwrite(bp);
540 1.1 bouyer }
541 1.1 bouyer
542 1.1 bouyer /*
543 1.1 bouyer * Free an inode.
544 1.1 bouyer *
545 1.1 bouyer * The specified inode is placed back in the free map.
546 1.1 bouyer */
547 1.1 bouyer int
548 1.27 yamt ext2fs_vfree(struct vnode *pvp, ino_t ino, int mode)
549 1.1 bouyer {
550 1.7 augustss struct m_ext2fs *fs;
551 1.7 augustss char *ibp;
552 1.7 augustss struct inode *pip;
553 1.1 bouyer struct buf *bp;
554 1.1 bouyer int error, cg;
555 1.1 bouyer
556 1.27 yamt pip = VTOI(pvp);
557 1.1 bouyer fs = pip->i_e2fs;
558 1.49 jdolecek
559 1.33 chs if ((u_int)ino > fs->e2fs.e2fs_icount || (u_int)ino < EXT2_FIRSTINO)
560 1.38 christos panic("ifree: range: dev = 0x%llx, ino = %llu, fs = %s",
561 1.38 christos (unsigned long long)pip->i_dev, (unsigned long long)ino,
562 1.38 christos fs->e2fs_fsmnt);
563 1.49 jdolecek
564 1.1 bouyer cg = ino_to_cg(fs, ino);
565 1.49 jdolecek
566 1.49 jdolecek KASSERT(!E2FS_HAS_GD_CSUM(fs) || (fs->e2fs_gd[cg].ext2bgd_flags & h2fs16(E2FS_BG_INODE_UNINIT)) == 0);
567 1.49 jdolecek
568 1.6 bouyer error = bread(pip->i_devvp,
569 1.49 jdolecek EXT2_FSBTODB(fs, fs2h32(fs->e2fs_gd[cg].ext2bgd_i_bitmap)),
570 1.46 maxv (int)fs->e2fs_bsize, B_MODIFY, &bp);
571 1.1 bouyer if (error) {
572 1.48 christos return 0;
573 1.1 bouyer }
574 1.1 bouyer ibp = (char *)bp->b_data;
575 1.1 bouyer ino = (ino - 1) % fs->e2fs.e2fs_ipg;
576 1.1 bouyer if (isclr(ibp, ino)) {
577 1.38 christos printf("dev = 0x%llx, ino = %llu, fs = %s\n",
578 1.38 christos (unsigned long long)pip->i_dev,
579 1.38 christos (unsigned long long)ino, fs->e2fs_fsmnt);
580 1.1 bouyer if (fs->e2fs_ronly == 0)
581 1.1 bouyer panic("ifree: freeing free inode");
582 1.1 bouyer }
583 1.1 bouyer clrbit(ibp, ino);
584 1.1 bouyer fs->e2fs.e2fs_ficount++;
585 1.49 jdolecek ext2fs_cg_update(fs, cg, &fs->e2fs_gd[cg],
586 1.49 jdolecek 0, 1, ((mode & IFMT) == IFDIR) ? -1 : 0, 0);
587 1.1 bouyer fs->e2fs_fmod = 1;
588 1.1 bouyer bdwrite(bp);
589 1.48 christos return 0;
590 1.1 bouyer }
591 1.1 bouyer
592 1.1 bouyer /*
593 1.1 bouyer * Find a block in the specified cylinder group.
594 1.1 bouyer *
595 1.1 bouyer * It is a panic if a request is made to find a block if none are
596 1.1 bouyer * available.
597 1.1 bouyer */
598 1.1 bouyer
599 1.15 fvdl static daddr_t
600 1.26 xtraeme ext2fs_mapsearch(struct m_ext2fs *fs, char *bbp, daddr_t bpref)
601 1.1 bouyer {
602 1.1 bouyer int start, len, loc, i, map;
603 1.1 bouyer
604 1.1 bouyer /*
605 1.1 bouyer * find the fragment by searching through the free block
606 1.1 bouyer * map for an appropriate bit pattern
607 1.1 bouyer */
608 1.1 bouyer if (bpref)
609 1.1 bouyer start = dtogd(fs, bpref) / NBBY;
610 1.1 bouyer else
611 1.1 bouyer start = 0;
612 1.1 bouyer len = howmany(fs->e2fs.e2fs_fpg, NBBY) - start;
613 1.1 bouyer loc = skpc(0xff, len, &bbp[start]);
614 1.1 bouyer if (loc == 0) {
615 1.1 bouyer len = start + 1;
616 1.1 bouyer start = 0;
617 1.1 bouyer loc = skpc(0xff, len, &bbp[start]);
618 1.1 bouyer if (loc == 0) {
619 1.1 bouyer printf("start = %d, len = %d, fs = %s\n",
620 1.1 bouyer start, len, fs->e2fs_fsmnt);
621 1.1 bouyer panic("ext2fs_alloccg: map corrupted");
622 1.1 bouyer /* NOTREACHED */
623 1.1 bouyer }
624 1.1 bouyer }
625 1.1 bouyer i = start + len - loc;
626 1.42 rmind map = bbp[i] ^ 0xff;
627 1.42 rmind if (map == 0) {
628 1.42 rmind printf("fs = %s\n", fs->e2fs_fsmnt);
629 1.42 rmind panic("ext2fs_mapsearch: block not in map");
630 1.42 rmind }
631 1.42 rmind return i * NBBY + ffs(map) - 1;
632 1.1 bouyer }
633 1.1 bouyer
634 1.1 bouyer /*
635 1.1 bouyer * Fserr prints the name of a file system with an error diagnostic.
636 1.23 perry *
637 1.1 bouyer * The form of the error message is:
638 1.1 bouyer * fs: error message
639 1.1 bouyer */
640 1.1 bouyer static void
641 1.26 xtraeme ext2fs_fserr(struct m_ext2fs *fs, u_int uid, const char *cp)
642 1.1 bouyer {
643 1.1 bouyer
644 1.1 bouyer log(LOG_ERR, "uid %d on %s: %s\n", uid, fs->e2fs_fsmnt, cp);
645 1.1 bouyer }
646 1.49 jdolecek
647 1.49 jdolecek static __inline void
648 1.49 jdolecek ext2fs_cg_update(struct m_ext2fs *fs, int cg, struct ext2_gd *gd, int nbfree, int nifree, int ndirs, daddr_t ioff)
649 1.49 jdolecek {
650 1.49 jdolecek /* XXX disk32 */
651 1.49 jdolecek if (nifree) {
652 1.49 jdolecek gd->ext2bgd_nifree = h2fs16(fs2h16(gd->ext2bgd_nifree) + nifree);
653 1.49 jdolecek /*
654 1.49 jdolecek * If we allocated inode on bigger offset than what was
655 1.49 jdolecek * ever used before, bump the itable_unused count. This
656 1.49 jdolecek * member only ever grows, and is used only for initialization
657 1.49 jdolecek * !INODE_ZEROED groups with used inodes. Of course, by the
658 1.49 jdolecek * time we get here the itables are already zeroed, but
659 1.49 jdolecek * e2fstools fsck.ext4 still checks this.
660 1.49 jdolecek */
661 1.49 jdolecek if (E2FS_HAS_GD_CSUM(fs) && nifree < 0 && (ioff+1) >= (fs->e2fs.e2fs_ipg - fs2h16(gd->ext2bgd_itable_unused_lo))) {
662 1.49 jdolecek gd->ext2bgd_itable_unused_lo = h2fs16(fs->e2fs.e2fs_ipg - (ioff + 1));
663 1.49 jdolecek }
664 1.49 jdolecek
665 1.49 jdolecek KASSERT(!E2FS_HAS_GD_CSUM(fs) || gd->ext2bgd_itable_unused_lo <= gd->ext2bgd_nifree);
666 1.49 jdolecek }
667 1.49 jdolecek
668 1.49 jdolecek
669 1.49 jdolecek if (nbfree)
670 1.49 jdolecek gd->ext2bgd_nbfree = h2fs16(fs2h16(gd->ext2bgd_nbfree) + nbfree);
671 1.49 jdolecek
672 1.49 jdolecek if (ndirs)
673 1.49 jdolecek gd->ext2bgd_ndirs = h2fs16(fs2h16(gd->ext2bgd_ndirs) + ndirs);
674 1.49 jdolecek
675 1.49 jdolecek if (E2FS_HAS_GD_CSUM(fs))
676 1.49 jdolecek gd->ext2bgd_checksum = ext2fs_cg_get_csum(fs, cg, gd);
677 1.49 jdolecek }
678 1.49 jdolecek
679 1.49 jdolecek /*
680 1.49 jdolecek * Compute group description csum. Structure data must be LE (not host).
681 1.49 jdolecek * Returned as LE (disk encoding).
682 1.49 jdolecek */
683 1.49 jdolecek static uint16_t
684 1.49 jdolecek ext2fs_cg_get_csum(struct m_ext2fs *fs, int cg, struct ext2_gd *gd)
685 1.49 jdolecek {
686 1.49 jdolecek uint16_t crc;
687 1.49 jdolecek uint32_t cg_bswapped = h2fs32((uint32_t)cg);
688 1.49 jdolecek size_t off;
689 1.49 jdolecek
690 1.49 jdolecek if (!EXT2F_HAS_ROCOMPAT_FEATURE(fs, EXT2F_ROCOMPAT_GDT_CSUM))
691 1.49 jdolecek return 0;
692 1.49 jdolecek
693 1.49 jdolecek off = offsetof(struct ext2_gd, ext2bgd_checksum);
694 1.49 jdolecek
695 1.49 jdolecek crc = crc16(~0, (uint8_t *)fs->e2fs.e2fs_uuid, sizeof(fs->e2fs.e2fs_uuid));
696 1.49 jdolecek crc = crc16(crc, (uint8_t *)&cg_bswapped, sizeof(cg_bswapped));
697 1.49 jdolecek crc = crc16(crc, (uint8_t *)gd, off);
698 1.49 jdolecek /* XXX ondisk32 */
699 1.49 jdolecek
700 1.49 jdolecek return h2fs16(crc);
701 1.49 jdolecek }
702 1.49 jdolecek
703 1.49 jdolecek static void
704 1.49 jdolecek ext2fs_init_bb(struct m_ext2fs *fs, int cg, struct ext2_gd *gd, char *bbp)
705 1.49 jdolecek {
706 1.49 jdolecek int i;
707 1.49 jdolecek
708 1.49 jdolecek memset(bbp, 0, fs->e2fs_bsize);
709 1.49 jdolecek
710 1.49 jdolecek /*
711 1.49 jdolecek * No block was ever allocated on this cg before, so the only used
712 1.49 jdolecek * blocks are metadata blocks on start of the group. We could optimize
713 1.49 jdolecek * this to set by bytes, but since this is done once per the group
714 1.49 jdolecek * in lifetime of filesystem, it really is not worth it.
715 1.49 jdolecek */
716 1.49 jdolecek for(i=0; i < fs->e2fs.e2fs_bpg - fs2h16(gd->ext2bgd_nbfree); i++)
717 1.49 jdolecek setbit(bbp, i);
718 1.49 jdolecek }
719 1.49 jdolecek
720 1.49 jdolecek /*
721 1.49 jdolecek * Verify csum and initialize itable if not done already
722 1.49 jdolecek */
723 1.49 jdolecek int
724 1.49 jdolecek ext2fs_cg_verify_and_initialize(struct vnode *devvp, struct m_ext2fs *fs, int ronly)
725 1.49 jdolecek {
726 1.49 jdolecek /* XXX disk32 */
727 1.49 jdolecek struct ext2_gd *gd;
728 1.49 jdolecek ino_t ioff;
729 1.49 jdolecek size_t boff;
730 1.49 jdolecek struct buf *bp;
731 1.49 jdolecek int cg, i, error;
732 1.49 jdolecek
733 1.49 jdolecek if (!E2FS_HAS_GD_CSUM(fs))
734 1.49 jdolecek return 0;
735 1.49 jdolecek
736 1.49 jdolecek for(cg=0; cg < fs->e2fs_ncg; cg++) {
737 1.49 jdolecek gd = &fs->e2fs_gd[cg];
738 1.49 jdolecek
739 1.49 jdolecek /* Verify checksum */
740 1.49 jdolecek if (gd->ext2bgd_checksum != ext2fs_cg_get_csum(fs, cg, gd)) {
741 1.49 jdolecek printf("ext2fs_cg_verify_and_initialize: group %d invalid csum\n", cg);
742 1.49 jdolecek return EINVAL;
743 1.49 jdolecek }
744 1.49 jdolecek
745 1.49 jdolecek /* if mounting read-write, zero itable if not already done */
746 1.49 jdolecek if (ronly || (gd->ext2bgd_flags & h2fs16(E2FS_BG_INODE_ZEROED)) != 0)
747 1.49 jdolecek continue;
748 1.49 jdolecek
749 1.49 jdolecek /*
750 1.49 jdolecek * We are skipping already used inodes, zero rest of itable
751 1.49 jdolecek * blocks. First block to zero could be only partial wipe, all
752 1.49 jdolecek * others are wiped completely. This might take a while,
753 1.49 jdolecek * there could be many inode table blocks. We use
754 1.49 jdolecek * delayed writes, so this shouldn't block for very
755 1.49 jdolecek * long.
756 1.49 jdolecek */
757 1.49 jdolecek ioff = fs->e2fs.e2fs_ipg - fs2h16(gd->ext2bgd_itable_unused_lo);
758 1.49 jdolecek boff = (ioff % fs->e2fs_ipb) * EXT2_DINODE_SIZE(fs);
759 1.49 jdolecek
760 1.49 jdolecek for(i = ioff / fs->e2fs_ipb; i < fs->e2fs_itpg; i++) {
761 1.49 jdolecek if (boff) {
762 1.49 jdolecek /* partial wipe, must read old data */
763 1.49 jdolecek error = bread(devvp,
764 1.49 jdolecek EXT2_FSBTODB(fs, fs2h32(gd->ext2bgd_i_tables) + i),
765 1.49 jdolecek (int)fs->e2fs_bsize, B_MODIFY, &bp);
766 1.49 jdolecek if (error) {
767 1.49 jdolecek printf("ext2fs_cg_verify_and_initialize: can't read itable block");
768 1.49 jdolecek return error;
769 1.49 jdolecek }
770 1.49 jdolecek memset((char *)bp->b_data + boff, 0, fs->e2fs_bsize - boff);
771 1.49 jdolecek boff = 0;
772 1.49 jdolecek } else {
773 1.49 jdolecek /*
774 1.49 jdolecek * Complete wipe, don't need to read data. This
775 1.49 jdolecek * assumes nothing else is changing the data.
776 1.49 jdolecek */
777 1.49 jdolecek bp = getblk(devvp,
778 1.49 jdolecek EXT2_FSBTODB(fs, fs2h32(gd->ext2bgd_i_tables) + i),
779 1.49 jdolecek (int)fs->e2fs_bsize, 0, 0);
780 1.49 jdolecek clrbuf(bp);
781 1.49 jdolecek }
782 1.49 jdolecek
783 1.49 jdolecek bdwrite(bp);
784 1.49 jdolecek }
785 1.49 jdolecek
786 1.49 jdolecek gd->ext2bgd_flags |= h2fs16(E2FS_BG_INODE_ZEROED);
787 1.49 jdolecek gd->ext2bgd_checksum = ext2fs_cg_get_csum(fs, cg, gd);
788 1.49 jdolecek fs->e2fs_fmod = 1;
789 1.49 jdolecek }
790 1.49 jdolecek
791 1.49 jdolecek return 0;
792 1.49 jdolecek }
793