ulfs_dirhash.c revision 1.2 1 1.2 dholland /* $NetBSD: ulfs_dirhash.c,v 1.2 2013/06/06 00:44:40 dholland Exp $ */
2 1.1 dholland /* from NetBSD: ufs_dirhash.c,v 1.34 2009/10/05 23:48:08 rmind Exp */
3 1.1 dholland
4 1.1 dholland /*
5 1.1 dholland * Copyright (c) 2001, 2002 Ian Dowse. All rights reserved.
6 1.1 dholland *
7 1.1 dholland * Redistribution and use in source and binary forms, with or without
8 1.1 dholland * modification, are permitted provided that the following conditions
9 1.1 dholland * are met:
10 1.1 dholland * 1. Redistributions of source code must retain the above copyright
11 1.1 dholland * notice, this list of conditions and the following disclaimer.
12 1.1 dholland * 2. Redistributions in binary form must reproduce the above copyright
13 1.1 dholland * notice, this list of conditions and the following disclaimer in the
14 1.1 dholland * documentation and/or other materials provided with the distribution.
15 1.1 dholland *
16 1.1 dholland * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
17 1.1 dholland * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
18 1.1 dholland * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
19 1.1 dholland * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
20 1.1 dholland * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
21 1.1 dholland * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
22 1.1 dholland * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
23 1.1 dholland * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
24 1.1 dholland * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
25 1.1 dholland * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
26 1.1 dholland * SUCH DAMAGE.
27 1.1 dholland *
28 1.1 dholland * $FreeBSD: src/sys/ufs/ufs/ufs_dirhash.c,v 1.3.2.8 2004/12/08 11:54:13 dwmalone Exp $
29 1.1 dholland */
30 1.1 dholland
31 1.1 dholland #include <sys/cdefs.h>
32 1.2 dholland __KERNEL_RCSID(0, "$NetBSD: ulfs_dirhash.c,v 1.2 2013/06/06 00:44:40 dholland Exp $");
33 1.1 dholland
34 1.1 dholland /*
35 1.1 dholland * This implements a hash-based lookup scheme for UFS directories.
36 1.1 dholland */
37 1.1 dholland
38 1.1 dholland #include <sys/param.h>
39 1.1 dholland #include <sys/systm.h>
40 1.1 dholland #include <sys/kernel.h>
41 1.1 dholland #include <sys/kmem.h>
42 1.1 dholland #include <sys/types.h>
43 1.1 dholland #include <sys/hash.h>
44 1.1 dholland #include <sys/proc.h>
45 1.1 dholland #include <sys/buf.h>
46 1.1 dholland #include <sys/vnode.h>
47 1.1 dholland #include <sys/mount.h>
48 1.1 dholland #include <sys/pool.h>
49 1.1 dholland #include <sys/sysctl.h>
50 1.1 dholland #include <sys/atomic.h>
51 1.1 dholland
52 1.2 dholland #include <ufs/lfs/ulfs_inode.h>
53 1.2 dholland #include <ufs/lfs/ulfs_dir.h>
54 1.2 dholland #include <ufs/lfs/ulfs_dirhash.h>
55 1.2 dholland #include <ufs/lfs/ulfsmount.h>
56 1.2 dholland #include <ufs/lfs/ulfs_bswap.h>
57 1.2 dholland #include <ufs/lfs/ulfs_extern.h>
58 1.1 dholland
59 1.1 dholland #define WRAPINCR(val, limit) (((val) + 1 == (limit)) ? 0 : ((val) + 1))
60 1.1 dholland #define WRAPDECR(val, limit) (((val) == 0) ? ((limit) - 1) : ((val) - 1))
61 1.1 dholland #define OFSFMT(ip) ((ip)->i_ump->um_maxsymlinklen <= 0)
62 1.1 dholland #define BLKFREE2IDX(n) ((n) > DH_NFSTATS ? DH_NFSTATS : (n))
63 1.1 dholland
64 1.1 dholland static u_int ufs_dirhashminblks = 5;
65 1.1 dholland static u_int ufs_dirhashmaxmem = 2 * 1024 * 1024;
66 1.1 dholland static u_int ufs_dirhashmem;
67 1.1 dholland static u_int ufs_dirhashcheck = 0;
68 1.1 dholland
69 1.1 dholland static int ufsdirhash_hash(struct dirhash *dh, const char *name, int namelen);
70 1.1 dholland static void ufsdirhash_adjfree(struct dirhash *dh, doff_t offset, int diff,
71 1.1 dholland int dirblksiz);
72 1.1 dholland static void ufsdirhash_delslot(struct dirhash *dh, int slot);
73 1.1 dholland static int ufsdirhash_findslot(struct dirhash *dh, const char *name,
74 1.1 dholland int namelen, doff_t offset);
75 1.1 dholland static doff_t ufsdirhash_getprev(struct direct *dp, doff_t offset,
76 1.1 dholland int dirblksiz);
77 1.1 dholland static int ufsdirhash_recycle(int wanted);
78 1.1 dholland
79 1.1 dholland static pool_cache_t ufsdirhashblk_cache;
80 1.1 dholland static pool_cache_t ufsdirhash_cache;
81 1.1 dholland
82 1.1 dholland #define DIRHASHLIST_LOCK() mutex_enter(&ufsdirhash_lock)
83 1.1 dholland #define DIRHASHLIST_UNLOCK() mutex_exit(&ufsdirhash_lock)
84 1.1 dholland #define DIRHASH_LOCK(dh) mutex_enter(&(dh)->dh_lock)
85 1.1 dholland #define DIRHASH_UNLOCK(dh) mutex_exit(&(dh)->dh_lock)
86 1.1 dholland #define DIRHASH_BLKALLOC() \
87 1.1 dholland pool_cache_get(ufsdirhashblk_cache, PR_NOWAIT)
88 1.1 dholland #define DIRHASH_BLKFREE(ptr) \
89 1.1 dholland pool_cache_put(ufsdirhashblk_cache, ptr)
90 1.1 dholland
91 1.1 dholland /* Dirhash list; recently-used entries are near the tail. */
92 1.1 dholland static TAILQ_HEAD(, dirhash) ufsdirhash_list;
93 1.1 dholland
94 1.1 dholland /* Protects: ufsdirhash_list, `dh_list' field, ufs_dirhashmem. */
95 1.1 dholland static kmutex_t ufsdirhash_lock;
96 1.1 dholland
97 1.1 dholland static struct sysctllog *ufsdirhash_sysctl_log;
98 1.1 dholland
99 1.1 dholland /*
100 1.1 dholland * Locking order:
101 1.1 dholland * ufsdirhash_lock
102 1.1 dholland * dh_lock
103 1.1 dholland *
104 1.1 dholland * The dh_lock mutex should be acquired either via the inode lock, or via
105 1.1 dholland * ufsdirhash_lock. Only the owner of the inode may free the associated
106 1.1 dholland * dirhash, but anything can steal its memory and set dh_hash to NULL.
107 1.1 dholland */
108 1.1 dholland
109 1.1 dholland /*
110 1.1 dholland * Attempt to build up a hash table for the directory contents in
111 1.1 dholland * inode 'ip'. Returns 0 on success, or -1 of the operation failed.
112 1.1 dholland */
113 1.1 dholland int
114 1.1 dholland ufsdirhash_build(struct inode *ip)
115 1.1 dholland {
116 1.1 dholland struct dirhash *dh;
117 1.1 dholland struct buf *bp = NULL;
118 1.1 dholland struct direct *ep;
119 1.1 dholland struct vnode *vp;
120 1.1 dholland doff_t bmask, pos;
121 1.1 dholland int dirblocks, i, j, memreqd, nblocks, narrays, nslots, slot;
122 1.1 dholland const int needswap = UFS_MPNEEDSWAP(ip->i_ump);
123 1.1 dholland int dirblksiz = ip->i_ump->um_dirblksiz;
124 1.1 dholland
125 1.1 dholland /* Check if we can/should use dirhash. */
126 1.1 dholland if (ip->i_dirhash == NULL) {
127 1.1 dholland if (ip->i_size < (ufs_dirhashminblks * dirblksiz) || OFSFMT(ip))
128 1.1 dholland return (-1);
129 1.1 dholland } else {
130 1.1 dholland /* Hash exists, but sysctls could have changed. */
131 1.1 dholland if (ip->i_size < (ufs_dirhashminblks * dirblksiz) ||
132 1.1 dholland ufs_dirhashmem > ufs_dirhashmaxmem) {
133 1.1 dholland ufsdirhash_free(ip);
134 1.1 dholland return (-1);
135 1.1 dholland }
136 1.1 dholland /* Check if hash exists and is intact (note: unlocked read). */
137 1.1 dholland if (ip->i_dirhash->dh_hash != NULL)
138 1.1 dholland return (0);
139 1.1 dholland /* Free the old, recycled hash and build a new one. */
140 1.1 dholland ufsdirhash_free(ip);
141 1.1 dholland }
142 1.1 dholland
143 1.1 dholland /* Don't hash removed directories. */
144 1.1 dholland if (ip->i_nlink == 0)
145 1.1 dholland return (-1);
146 1.1 dholland
147 1.1 dholland vp = ip->i_vnode;
148 1.1 dholland /* Allocate 50% more entries than this dir size could ever need. */
149 1.1 dholland KASSERT(ip->i_size >= dirblksiz);
150 1.1 dholland nslots = ip->i_size / DIRECTSIZ(1);
151 1.1 dholland nslots = (nslots * 3 + 1) / 2;
152 1.1 dholland narrays = howmany(nslots, DH_NBLKOFF);
153 1.1 dholland nslots = narrays * DH_NBLKOFF;
154 1.1 dholland dirblocks = howmany(ip->i_size, dirblksiz);
155 1.1 dholland nblocks = (dirblocks * 3 + 1) / 2;
156 1.1 dholland
157 1.1 dholland memreqd = sizeof(*dh) + narrays * sizeof(*dh->dh_hash) +
158 1.1 dholland narrays * DH_NBLKOFF * sizeof(**dh->dh_hash) +
159 1.1 dholland nblocks * sizeof(*dh->dh_blkfree);
160 1.1 dholland
161 1.1 dholland while (atomic_add_int_nv(&ufs_dirhashmem, memreqd) >
162 1.1 dholland ufs_dirhashmaxmem) {
163 1.1 dholland atomic_add_int(&ufs_dirhashmem, -memreqd);
164 1.1 dholland if (memreqd > ufs_dirhashmaxmem / 2)
165 1.1 dholland return (-1);
166 1.1 dholland /* Try to free some space. */
167 1.1 dholland if (ufsdirhash_recycle(memreqd) != 0)
168 1.1 dholland return (-1);
169 1.1 dholland else
170 1.1 dholland DIRHASHLIST_UNLOCK();
171 1.1 dholland }
172 1.1 dholland
173 1.1 dholland /*
174 1.1 dholland * Use non-blocking mallocs so that we will revert to a linear
175 1.1 dholland * lookup on failure rather than potentially blocking forever.
176 1.1 dholland */
177 1.1 dholland dh = pool_cache_get(ufsdirhash_cache, PR_NOWAIT);
178 1.1 dholland if (dh == NULL) {
179 1.1 dholland atomic_add_int(&ufs_dirhashmem, -memreqd);
180 1.1 dholland return (-1);
181 1.1 dholland }
182 1.1 dholland memset(dh, 0, sizeof(*dh));
183 1.1 dholland mutex_init(&dh->dh_lock, MUTEX_DEFAULT, IPL_NONE);
184 1.1 dholland DIRHASH_LOCK(dh);
185 1.1 dholland dh->dh_hashsz = narrays * sizeof(dh->dh_hash[0]);
186 1.1 dholland dh->dh_hash = kmem_zalloc(dh->dh_hashsz, KM_NOSLEEP);
187 1.1 dholland dh->dh_blkfreesz = nblocks * sizeof(dh->dh_blkfree[0]);
188 1.1 dholland dh->dh_blkfree = kmem_zalloc(dh->dh_blkfreesz, KM_NOSLEEP);
189 1.1 dholland if (dh->dh_hash == NULL || dh->dh_blkfree == NULL)
190 1.1 dholland goto fail;
191 1.1 dholland for (i = 0; i < narrays; i++) {
192 1.1 dholland if ((dh->dh_hash[i] = DIRHASH_BLKALLOC()) == NULL)
193 1.1 dholland goto fail;
194 1.1 dholland for (j = 0; j < DH_NBLKOFF; j++)
195 1.1 dholland dh->dh_hash[i][j] = DIRHASH_EMPTY;
196 1.1 dholland }
197 1.1 dholland
198 1.1 dholland /* Initialise the hash table and block statistics. */
199 1.1 dholland dh->dh_narrays = narrays;
200 1.1 dholland dh->dh_hlen = nslots;
201 1.1 dholland dh->dh_nblk = nblocks;
202 1.1 dholland dh->dh_dirblks = dirblocks;
203 1.1 dholland for (i = 0; i < dirblocks; i++)
204 1.1 dholland dh->dh_blkfree[i] = dirblksiz / DIRALIGN;
205 1.1 dholland for (i = 0; i < DH_NFSTATS; i++)
206 1.1 dholland dh->dh_firstfree[i] = -1;
207 1.1 dholland dh->dh_firstfree[DH_NFSTATS] = 0;
208 1.1 dholland dh->dh_seqopt = 0;
209 1.1 dholland dh->dh_seqoff = 0;
210 1.1 dholland dh->dh_score = DH_SCOREINIT;
211 1.1 dholland ip->i_dirhash = dh;
212 1.1 dholland
213 1.1 dholland bmask = VFSTOUFS(vp->v_mount)->um_mountp->mnt_stat.f_iosize - 1;
214 1.1 dholland pos = 0;
215 1.1 dholland while (pos < ip->i_size) {
216 1.1 dholland if ((curcpu()->ci_schedstate.spc_flags & SPCF_SHOULDYIELD)
217 1.1 dholland != 0) {
218 1.1 dholland preempt();
219 1.1 dholland }
220 1.1 dholland /* If necessary, get the next directory block. */
221 1.1 dholland if ((pos & bmask) == 0) {
222 1.1 dholland if (bp != NULL)
223 1.1 dholland brelse(bp, 0);
224 1.1 dholland if (ufs_blkatoff(vp, (off_t)pos, NULL, &bp, false) != 0)
225 1.1 dholland goto fail;
226 1.1 dholland }
227 1.1 dholland
228 1.1 dholland /* Add this entry to the hash. */
229 1.1 dholland ep = (struct direct *)((char *)bp->b_data + (pos & bmask));
230 1.1 dholland if (ep->d_reclen == 0 || ep->d_reclen >
231 1.1 dholland dirblksiz - (pos & (dirblksiz - 1))) {
232 1.1 dholland /* Corrupted directory. */
233 1.1 dholland brelse(bp, 0);
234 1.1 dholland goto fail;
235 1.1 dholland }
236 1.1 dholland if (ep->d_ino != 0) {
237 1.1 dholland /* Add the entry (simplified ufsdirhash_add). */
238 1.1 dholland slot = ufsdirhash_hash(dh, ep->d_name, ep->d_namlen);
239 1.1 dholland while (DH_ENTRY(dh, slot) != DIRHASH_EMPTY)
240 1.1 dholland slot = WRAPINCR(slot, dh->dh_hlen);
241 1.1 dholland dh->dh_hused++;
242 1.1 dholland DH_ENTRY(dh, slot) = pos;
243 1.1 dholland ufsdirhash_adjfree(dh, pos, -DIRSIZ(0, ep, needswap),
244 1.1 dholland dirblksiz);
245 1.1 dholland }
246 1.1 dholland pos += ep->d_reclen;
247 1.1 dholland }
248 1.1 dholland
249 1.1 dholland if (bp != NULL)
250 1.1 dholland brelse(bp, 0);
251 1.1 dholland DIRHASHLIST_LOCK();
252 1.1 dholland TAILQ_INSERT_TAIL(&ufsdirhash_list, dh, dh_list);
253 1.1 dholland dh->dh_onlist = 1;
254 1.1 dholland DIRHASH_UNLOCK(dh);
255 1.1 dholland DIRHASHLIST_UNLOCK();
256 1.1 dholland return (0);
257 1.1 dholland
258 1.1 dholland fail:
259 1.1 dholland DIRHASH_UNLOCK(dh);
260 1.1 dholland if (dh->dh_hash != NULL) {
261 1.1 dholland for (i = 0; i < narrays; i++)
262 1.1 dholland if (dh->dh_hash[i] != NULL)
263 1.1 dholland DIRHASH_BLKFREE(dh->dh_hash[i]);
264 1.1 dholland kmem_free(dh->dh_hash, dh->dh_hashsz);
265 1.1 dholland }
266 1.1 dholland if (dh->dh_blkfree != NULL)
267 1.1 dholland kmem_free(dh->dh_blkfree, dh->dh_blkfreesz);
268 1.1 dholland mutex_destroy(&dh->dh_lock);
269 1.1 dholland pool_cache_put(ufsdirhash_cache, dh);
270 1.1 dholland ip->i_dirhash = NULL;
271 1.1 dholland atomic_add_int(&ufs_dirhashmem, -memreqd);
272 1.1 dholland return (-1);
273 1.1 dholland }
274 1.1 dholland
275 1.1 dholland /*
276 1.1 dholland * Free any hash table associated with inode 'ip'.
277 1.1 dholland */
278 1.1 dholland void
279 1.1 dholland ufsdirhash_free(struct inode *ip)
280 1.1 dholland {
281 1.1 dholland struct dirhash *dh;
282 1.1 dholland int i, mem;
283 1.1 dholland
284 1.1 dholland if ((dh = ip->i_dirhash) == NULL)
285 1.1 dholland return;
286 1.1 dholland
287 1.1 dholland if (dh->dh_onlist) {
288 1.1 dholland DIRHASHLIST_LOCK();
289 1.1 dholland if (dh->dh_onlist)
290 1.1 dholland TAILQ_REMOVE(&ufsdirhash_list, dh, dh_list);
291 1.1 dholland DIRHASHLIST_UNLOCK();
292 1.1 dholland }
293 1.1 dholland
294 1.1 dholland /* The dirhash pointed to by 'dh' is exclusively ours now. */
295 1.1 dholland mem = sizeof(*dh);
296 1.1 dholland if (dh->dh_hash != NULL) {
297 1.1 dholland for (i = 0; i < dh->dh_narrays; i++)
298 1.1 dholland DIRHASH_BLKFREE(dh->dh_hash[i]);
299 1.1 dholland kmem_free(dh->dh_hash, dh->dh_hashsz);
300 1.1 dholland kmem_free(dh->dh_blkfree, dh->dh_blkfreesz);
301 1.1 dholland mem += dh->dh_hashsz;
302 1.1 dholland mem += dh->dh_narrays * DH_NBLKOFF * sizeof(**dh->dh_hash);
303 1.1 dholland mem += dh->dh_nblk * sizeof(*dh->dh_blkfree);
304 1.1 dholland }
305 1.1 dholland mutex_destroy(&dh->dh_lock);
306 1.1 dholland pool_cache_put(ufsdirhash_cache, dh);
307 1.1 dholland ip->i_dirhash = NULL;
308 1.1 dholland
309 1.1 dholland atomic_add_int(&ufs_dirhashmem, -mem);
310 1.1 dholland }
311 1.1 dholland
312 1.1 dholland /*
313 1.1 dholland * Find the offset of the specified name within the given inode.
314 1.1 dholland * Returns 0 on success, ENOENT if the entry does not exist, or
315 1.1 dholland * EJUSTRETURN if the caller should revert to a linear search.
316 1.1 dholland *
317 1.1 dholland * If successful, the directory offset is stored in *offp, and a
318 1.1 dholland * pointer to a struct buf containing the entry is stored in *bpp. If
319 1.1 dholland * prevoffp is non-NULL, the offset of the previous entry within
320 1.1 dholland * the DIRBLKSIZ-sized block is stored in *prevoffp (if the entry
321 1.1 dholland * is the first in a block, the start of the block is used).
322 1.1 dholland */
323 1.1 dholland int
324 1.1 dholland ufsdirhash_lookup(struct inode *ip, const char *name, int namelen, doff_t *offp,
325 1.1 dholland struct buf **bpp, doff_t *prevoffp)
326 1.1 dholland {
327 1.1 dholland struct dirhash *dh, *dh_next;
328 1.1 dholland struct direct *dp;
329 1.1 dholland struct vnode *vp;
330 1.1 dholland struct buf *bp;
331 1.1 dholland doff_t blkoff, bmask, offset, prevoff;
332 1.1 dholland int i, slot;
333 1.1 dholland const int needswap = UFS_MPNEEDSWAP(ip->i_ump);
334 1.1 dholland int dirblksiz = ip->i_ump->um_dirblksiz;
335 1.1 dholland
336 1.1 dholland if ((dh = ip->i_dirhash) == NULL)
337 1.1 dholland return (EJUSTRETURN);
338 1.1 dholland
339 1.1 dholland /*
340 1.1 dholland * Move this dirhash towards the end of the list if it has a
341 1.1 dholland * score higher than the next entry, and acquire the dh_lock.
342 1.1 dholland * Optimise the case where it's already the last by performing
343 1.1 dholland * an unlocked read of the TAILQ_NEXT pointer.
344 1.1 dholland *
345 1.1 dholland * In both cases, end up holding just dh_lock.
346 1.1 dholland */
347 1.1 dholland if (TAILQ_NEXT(dh, dh_list) != NULL) {
348 1.1 dholland DIRHASHLIST_LOCK();
349 1.1 dholland DIRHASH_LOCK(dh);
350 1.1 dholland /*
351 1.1 dholland * If the new score will be greater than that of the next
352 1.1 dholland * entry, then move this entry past it. With both mutexes
353 1.1 dholland * held, dh_next won't go away, but its dh_score could
354 1.1 dholland * change; that's not important since it is just a hint.
355 1.1 dholland */
356 1.1 dholland if (dh->dh_hash != NULL &&
357 1.1 dholland (dh_next = TAILQ_NEXT(dh, dh_list)) != NULL &&
358 1.1 dholland dh->dh_score >= dh_next->dh_score) {
359 1.1 dholland KASSERT(dh->dh_onlist);
360 1.1 dholland TAILQ_REMOVE(&ufsdirhash_list, dh, dh_list);
361 1.1 dholland TAILQ_INSERT_AFTER(&ufsdirhash_list, dh_next, dh,
362 1.1 dholland dh_list);
363 1.1 dholland }
364 1.1 dholland DIRHASHLIST_UNLOCK();
365 1.1 dholland } else {
366 1.1 dholland /* Already the last, though that could change as we wait. */
367 1.1 dholland DIRHASH_LOCK(dh);
368 1.1 dholland }
369 1.1 dholland if (dh->dh_hash == NULL) {
370 1.1 dholland DIRHASH_UNLOCK(dh);
371 1.1 dholland ufsdirhash_free(ip);
372 1.1 dholland return (EJUSTRETURN);
373 1.1 dholland }
374 1.1 dholland
375 1.1 dholland /* Update the score. */
376 1.1 dholland if (dh->dh_score < DH_SCOREMAX)
377 1.1 dholland dh->dh_score++;
378 1.1 dholland
379 1.1 dholland vp = ip->i_vnode;
380 1.1 dholland bmask = VFSTOUFS(vp->v_mount)->um_mountp->mnt_stat.f_iosize - 1;
381 1.1 dholland blkoff = -1;
382 1.1 dholland bp = NULL;
383 1.1 dholland restart:
384 1.1 dholland slot = ufsdirhash_hash(dh, name, namelen);
385 1.1 dholland
386 1.1 dholland if (dh->dh_seqopt) {
387 1.1 dholland /*
388 1.1 dholland * Sequential access optimisation. dh_seqoff contains the
389 1.1 dholland * offset of the directory entry immediately following
390 1.1 dholland * the last entry that was looked up. Check if this offset
391 1.1 dholland * appears in the hash chain for the name we are looking for.
392 1.1 dholland */
393 1.1 dholland for (i = slot; (offset = DH_ENTRY(dh, i)) != DIRHASH_EMPTY;
394 1.1 dholland i = WRAPINCR(i, dh->dh_hlen))
395 1.1 dholland if (offset == dh->dh_seqoff)
396 1.1 dholland break;
397 1.1 dholland if (offset == dh->dh_seqoff) {
398 1.1 dholland /*
399 1.1 dholland * We found an entry with the expected offset. This
400 1.1 dholland * is probably the entry we want, but if not, the
401 1.1 dholland * code below will turn off seqoff and retry.
402 1.1 dholland */
403 1.1 dholland slot = i;
404 1.1 dholland } else
405 1.1 dholland dh->dh_seqopt = 0;
406 1.1 dholland }
407 1.1 dholland
408 1.1 dholland for (; (offset = DH_ENTRY(dh, slot)) != DIRHASH_EMPTY;
409 1.1 dholland slot = WRAPINCR(slot, dh->dh_hlen)) {
410 1.1 dholland if (offset == DIRHASH_DEL)
411 1.1 dholland continue;
412 1.1 dholland
413 1.1 dholland if (offset < 0 || offset >= ip->i_size)
414 1.1 dholland panic("ufsdirhash_lookup: bad offset in hash array");
415 1.1 dholland if ((offset & ~bmask) != blkoff) {
416 1.1 dholland if (bp != NULL)
417 1.1 dholland brelse(bp, 0);
418 1.1 dholland blkoff = offset & ~bmask;
419 1.1 dholland if (ufs_blkatoff(vp, (off_t)blkoff,
420 1.1 dholland NULL, &bp, false) != 0) {
421 1.1 dholland DIRHASH_UNLOCK(dh);
422 1.1 dholland return (EJUSTRETURN);
423 1.1 dholland }
424 1.1 dholland }
425 1.1 dholland dp = (struct direct *)((char *)bp->b_data + (offset & bmask));
426 1.1 dholland if (dp->d_reclen == 0 || dp->d_reclen >
427 1.1 dholland dirblksiz - (offset & (dirblksiz - 1))) {
428 1.1 dholland /* Corrupted directory. */
429 1.1 dholland DIRHASH_UNLOCK(dh);
430 1.1 dholland brelse(bp, 0);
431 1.1 dholland return (EJUSTRETURN);
432 1.1 dholland }
433 1.1 dholland if (dp->d_namlen == namelen &&
434 1.1 dholland memcmp(dp->d_name, name, namelen) == 0) {
435 1.1 dholland /* Found. Get the prev offset if needed. */
436 1.1 dholland if (prevoffp != NULL) {
437 1.1 dholland if (offset & (dirblksiz - 1)) {
438 1.1 dholland prevoff = ufsdirhash_getprev(dp,
439 1.1 dholland offset, dirblksiz);
440 1.1 dholland if (prevoff == -1) {
441 1.1 dholland brelse(bp, 0);
442 1.1 dholland return (EJUSTRETURN);
443 1.1 dholland }
444 1.1 dholland } else
445 1.1 dholland prevoff = offset;
446 1.1 dholland *prevoffp = prevoff;
447 1.1 dholland }
448 1.1 dholland
449 1.1 dholland /* Check for sequential access, and update offset. */
450 1.1 dholland if (dh->dh_seqopt == 0 && dh->dh_seqoff == offset)
451 1.1 dholland dh->dh_seqopt = 1;
452 1.1 dholland dh->dh_seqoff = offset + DIRSIZ(0, dp, needswap);
453 1.1 dholland DIRHASH_UNLOCK(dh);
454 1.1 dholland
455 1.1 dholland *bpp = bp;
456 1.1 dholland *offp = offset;
457 1.1 dholland return (0);
458 1.1 dholland }
459 1.1 dholland
460 1.1 dholland if (dh->dh_hash == NULL) {
461 1.1 dholland DIRHASH_UNLOCK(dh);
462 1.1 dholland if (bp != NULL)
463 1.1 dholland brelse(bp, 0);
464 1.1 dholland ufsdirhash_free(ip);
465 1.1 dholland return (EJUSTRETURN);
466 1.1 dholland }
467 1.1 dholland /*
468 1.1 dholland * When the name doesn't match in the seqopt case, go back
469 1.1 dholland * and search normally.
470 1.1 dholland */
471 1.1 dholland if (dh->dh_seqopt) {
472 1.1 dholland dh->dh_seqopt = 0;
473 1.1 dholland goto restart;
474 1.1 dholland }
475 1.1 dholland }
476 1.1 dholland DIRHASH_UNLOCK(dh);
477 1.1 dholland if (bp != NULL)
478 1.1 dholland brelse(bp, 0);
479 1.1 dholland return (ENOENT);
480 1.1 dholland }
481 1.1 dholland
482 1.1 dholland /*
483 1.1 dholland * Find a directory block with room for 'slotneeded' bytes. Returns
484 1.1 dholland * the offset of the directory entry that begins the free space.
485 1.1 dholland * This will either be the offset of an existing entry that has free
486 1.1 dholland * space at the end, or the offset of an entry with d_ino == 0 at
487 1.1 dholland * the start of a DIRBLKSIZ block.
488 1.1 dholland *
489 1.1 dholland * To use the space, the caller may need to compact existing entries in
490 1.1 dholland * the directory. The total number of bytes in all of the entries involved
491 1.1 dholland * in the compaction is stored in *slotsize. In other words, all of
492 1.1 dholland * the entries that must be compacted are exactly contained in the
493 1.1 dholland * region beginning at the returned offset and spanning *slotsize bytes.
494 1.1 dholland *
495 1.1 dholland * Returns -1 if no space was found, indicating that the directory
496 1.1 dholland * must be extended.
497 1.1 dholland */
498 1.1 dholland doff_t
499 1.1 dholland ufsdirhash_findfree(struct inode *ip, int slotneeded, int *slotsize)
500 1.1 dholland {
501 1.1 dholland struct direct *dp;
502 1.1 dholland struct dirhash *dh;
503 1.1 dholland struct buf *bp;
504 1.1 dholland doff_t pos, slotstart;
505 1.1 dholland int dirblock, error, freebytes, i;
506 1.1 dholland const int needswap = UFS_MPNEEDSWAP(ip->i_ump);
507 1.1 dholland int dirblksiz = ip->i_ump->um_dirblksiz;
508 1.1 dholland
509 1.1 dholland if ((dh = ip->i_dirhash) == NULL)
510 1.1 dholland return (-1);
511 1.1 dholland
512 1.1 dholland DIRHASH_LOCK(dh);
513 1.1 dholland if (dh->dh_hash == NULL) {
514 1.1 dholland DIRHASH_UNLOCK(dh);
515 1.1 dholland ufsdirhash_free(ip);
516 1.1 dholland return (-1);
517 1.1 dholland }
518 1.1 dholland
519 1.1 dholland /* Find a directory block with the desired free space. */
520 1.1 dholland dirblock = -1;
521 1.1 dholland for (i = howmany(slotneeded, DIRALIGN); i <= DH_NFSTATS; i++)
522 1.1 dholland if ((dirblock = dh->dh_firstfree[i]) != -1)
523 1.1 dholland break;
524 1.1 dholland if (dirblock == -1) {
525 1.1 dholland DIRHASH_UNLOCK(dh);
526 1.1 dholland return (-1);
527 1.1 dholland }
528 1.1 dholland
529 1.1 dholland KASSERT(dirblock < dh->dh_nblk &&
530 1.1 dholland dh->dh_blkfree[dirblock] >= howmany(slotneeded, DIRALIGN));
531 1.1 dholland pos = dirblock * dirblksiz;
532 1.1 dholland error = ufs_blkatoff(ip->i_vnode, (off_t)pos, (void *)&dp, &bp, false);
533 1.1 dholland if (error) {
534 1.1 dholland DIRHASH_UNLOCK(dh);
535 1.1 dholland return (-1);
536 1.1 dholland }
537 1.1 dholland /* Find the first entry with free space. */
538 1.1 dholland for (i = 0; i < dirblksiz; ) {
539 1.1 dholland if (dp->d_reclen == 0) {
540 1.1 dholland DIRHASH_UNLOCK(dh);
541 1.1 dholland brelse(bp, 0);
542 1.1 dholland return (-1);
543 1.1 dholland }
544 1.1 dholland if (dp->d_ino == 0 || dp->d_reclen > DIRSIZ(0, dp, needswap))
545 1.1 dholland break;
546 1.1 dholland i += dp->d_reclen;
547 1.1 dholland dp = (struct direct *)((char *)dp + dp->d_reclen);
548 1.1 dholland }
549 1.1 dholland if (i > dirblksiz) {
550 1.1 dholland DIRHASH_UNLOCK(dh);
551 1.1 dholland brelse(bp, 0);
552 1.1 dholland return (-1);
553 1.1 dholland }
554 1.1 dholland slotstart = pos + i;
555 1.1 dholland
556 1.1 dholland /* Find the range of entries needed to get enough space */
557 1.1 dholland freebytes = 0;
558 1.1 dholland while (i < dirblksiz && freebytes < slotneeded) {
559 1.1 dholland freebytes += dp->d_reclen;
560 1.1 dholland if (dp->d_ino != 0)
561 1.1 dholland freebytes -= DIRSIZ(0, dp, needswap);
562 1.1 dholland if (dp->d_reclen == 0) {
563 1.1 dholland DIRHASH_UNLOCK(dh);
564 1.1 dholland brelse(bp, 0);
565 1.1 dholland return (-1);
566 1.1 dholland }
567 1.1 dholland i += dp->d_reclen;
568 1.1 dholland dp = (struct direct *)((char *)dp + dp->d_reclen);
569 1.1 dholland }
570 1.1 dholland if (i > dirblksiz) {
571 1.1 dholland DIRHASH_UNLOCK(dh);
572 1.1 dholland brelse(bp, 0);
573 1.1 dholland return (-1);
574 1.1 dholland }
575 1.1 dholland if (freebytes < slotneeded)
576 1.1 dholland panic("ufsdirhash_findfree: free mismatch");
577 1.1 dholland DIRHASH_UNLOCK(dh);
578 1.1 dholland brelse(bp, 0);
579 1.1 dholland *slotsize = pos + i - slotstart;
580 1.1 dholland return (slotstart);
581 1.1 dholland }
582 1.1 dholland
583 1.1 dholland /*
584 1.1 dholland * Return the start of the unused space at the end of a directory, or
585 1.1 dholland * -1 if there are no trailing unused blocks.
586 1.1 dholland */
587 1.1 dholland doff_t
588 1.1 dholland ufsdirhash_enduseful(struct inode *ip)
589 1.1 dholland {
590 1.1 dholland struct dirhash *dh;
591 1.1 dholland int i;
592 1.1 dholland int dirblksiz = ip->i_ump->um_dirblksiz;
593 1.1 dholland
594 1.1 dholland if ((dh = ip->i_dirhash) == NULL)
595 1.1 dholland return (-1);
596 1.1 dholland
597 1.1 dholland DIRHASH_LOCK(dh);
598 1.1 dholland if (dh->dh_hash == NULL) {
599 1.1 dholland DIRHASH_UNLOCK(dh);
600 1.1 dholland ufsdirhash_free(ip);
601 1.1 dholland return (-1);
602 1.1 dholland }
603 1.1 dholland
604 1.1 dholland if (dh->dh_blkfree[dh->dh_dirblks - 1] != dirblksiz / DIRALIGN) {
605 1.1 dholland DIRHASH_UNLOCK(dh);
606 1.1 dholland return (-1);
607 1.1 dholland }
608 1.1 dholland
609 1.1 dholland for (i = dh->dh_dirblks - 1; i >= 0; i--)
610 1.1 dholland if (dh->dh_blkfree[i] != dirblksiz / DIRALIGN)
611 1.1 dholland break;
612 1.1 dholland DIRHASH_UNLOCK(dh);
613 1.1 dholland return ((doff_t)(i + 1) * dirblksiz);
614 1.1 dholland }
615 1.1 dholland
616 1.1 dholland /*
617 1.1 dholland * Insert information into the hash about a new directory entry. dirp
618 1.1 dholland * points to a struct direct containing the entry, and offset specifies
619 1.1 dholland * the offset of this entry.
620 1.1 dholland */
621 1.1 dholland void
622 1.1 dholland ufsdirhash_add(struct inode *ip, struct direct *dirp, doff_t offset)
623 1.1 dholland {
624 1.1 dholland struct dirhash *dh;
625 1.1 dholland int slot;
626 1.1 dholland const int needswap = UFS_MPNEEDSWAP(ip->i_ump);
627 1.1 dholland int dirblksiz = ip->i_ump->um_dirblksiz;
628 1.1 dholland
629 1.1 dholland if ((dh = ip->i_dirhash) == NULL)
630 1.1 dholland return;
631 1.1 dholland
632 1.1 dholland DIRHASH_LOCK(dh);
633 1.1 dholland if (dh->dh_hash == NULL) {
634 1.1 dholland DIRHASH_UNLOCK(dh);
635 1.1 dholland ufsdirhash_free(ip);
636 1.1 dholland return;
637 1.1 dholland }
638 1.1 dholland
639 1.1 dholland KASSERT(offset < dh->dh_dirblks * dirblksiz);
640 1.1 dholland /*
641 1.1 dholland * Normal hash usage is < 66%. If the usage gets too high then
642 1.1 dholland * remove the hash entirely and let it be rebuilt later.
643 1.1 dholland */
644 1.1 dholland if (dh->dh_hused >= (dh->dh_hlen * 3) / 4) {
645 1.1 dholland DIRHASH_UNLOCK(dh);
646 1.1 dholland ufsdirhash_free(ip);
647 1.1 dholland return;
648 1.1 dholland }
649 1.1 dholland
650 1.1 dholland /* Find a free hash slot (empty or deleted), and add the entry. */
651 1.1 dholland slot = ufsdirhash_hash(dh, dirp->d_name, dirp->d_namlen);
652 1.1 dholland while (DH_ENTRY(dh, slot) >= 0)
653 1.1 dholland slot = WRAPINCR(slot, dh->dh_hlen);
654 1.1 dholland if (DH_ENTRY(dh, slot) == DIRHASH_EMPTY)
655 1.1 dholland dh->dh_hused++;
656 1.1 dholland DH_ENTRY(dh, slot) = offset;
657 1.1 dholland
658 1.1 dholland /* Update the per-block summary info. */
659 1.1 dholland ufsdirhash_adjfree(dh, offset, -DIRSIZ(0, dirp, needswap), dirblksiz);
660 1.1 dholland DIRHASH_UNLOCK(dh);
661 1.1 dholland }
662 1.1 dholland
663 1.1 dholland /*
664 1.1 dholland * Remove the specified directory entry from the hash. The entry to remove
665 1.1 dholland * is defined by the name in `dirp', which must exist at the specified
666 1.1 dholland * `offset' within the directory.
667 1.1 dholland */
668 1.1 dholland void
669 1.1 dholland ufsdirhash_remove(struct inode *ip, struct direct *dirp, doff_t offset)
670 1.1 dholland {
671 1.1 dholland struct dirhash *dh;
672 1.1 dholland int slot;
673 1.1 dholland const int needswap = UFS_MPNEEDSWAP(ip->i_ump);
674 1.1 dholland int dirblksiz = ip->i_ump->um_dirblksiz;
675 1.1 dholland
676 1.1 dholland if ((dh = ip->i_dirhash) == NULL)
677 1.1 dholland return;
678 1.1 dholland
679 1.1 dholland DIRHASH_LOCK(dh);
680 1.1 dholland if (dh->dh_hash == NULL) {
681 1.1 dholland DIRHASH_UNLOCK(dh);
682 1.1 dholland ufsdirhash_free(ip);
683 1.1 dholland return;
684 1.1 dholland }
685 1.1 dholland
686 1.1 dholland KASSERT(offset < dh->dh_dirblks * dirblksiz);
687 1.1 dholland /* Find the entry */
688 1.1 dholland slot = ufsdirhash_findslot(dh, dirp->d_name, dirp->d_namlen, offset);
689 1.1 dholland
690 1.1 dholland /* Remove the hash entry. */
691 1.1 dholland ufsdirhash_delslot(dh, slot);
692 1.1 dholland
693 1.1 dholland /* Update the per-block summary info. */
694 1.1 dholland ufsdirhash_adjfree(dh, offset, DIRSIZ(0, dirp, needswap), dirblksiz);
695 1.1 dholland DIRHASH_UNLOCK(dh);
696 1.1 dholland }
697 1.1 dholland
698 1.1 dholland /*
699 1.1 dholland * Change the offset associated with a directory entry in the hash. Used
700 1.1 dholland * when compacting directory blocks.
701 1.1 dholland */
702 1.1 dholland void
703 1.1 dholland ufsdirhash_move(struct inode *ip, struct direct *dirp, doff_t oldoff,
704 1.1 dholland doff_t newoff)
705 1.1 dholland {
706 1.1 dholland struct dirhash *dh;
707 1.1 dholland int slot;
708 1.1 dholland
709 1.1 dholland if ((dh = ip->i_dirhash) == NULL)
710 1.1 dholland return;
711 1.1 dholland DIRHASH_LOCK(dh);
712 1.1 dholland if (dh->dh_hash == NULL) {
713 1.1 dholland DIRHASH_UNLOCK(dh);
714 1.1 dholland ufsdirhash_free(ip);
715 1.1 dholland return;
716 1.1 dholland }
717 1.1 dholland
718 1.1 dholland KASSERT(oldoff < dh->dh_dirblks * ip->i_ump->um_dirblksiz &&
719 1.1 dholland newoff < dh->dh_dirblks * ip->i_ump->um_dirblksiz);
720 1.1 dholland /* Find the entry, and update the offset. */
721 1.1 dholland slot = ufsdirhash_findslot(dh, dirp->d_name, dirp->d_namlen, oldoff);
722 1.1 dholland DH_ENTRY(dh, slot) = newoff;
723 1.1 dholland DIRHASH_UNLOCK(dh);
724 1.1 dholland }
725 1.1 dholland
726 1.1 dholland /*
727 1.1 dholland * Inform dirhash that the directory has grown by one block that
728 1.1 dholland * begins at offset (i.e. the new length is offset + DIRBLKSIZ).
729 1.1 dholland */
730 1.1 dholland void
731 1.1 dholland ufsdirhash_newblk(struct inode *ip, doff_t offset)
732 1.1 dholland {
733 1.1 dholland struct dirhash *dh;
734 1.1 dholland int block;
735 1.1 dholland int dirblksiz = ip->i_ump->um_dirblksiz;
736 1.1 dholland
737 1.1 dholland if ((dh = ip->i_dirhash) == NULL)
738 1.1 dholland return;
739 1.1 dholland DIRHASH_LOCK(dh);
740 1.1 dholland if (dh->dh_hash == NULL) {
741 1.1 dholland DIRHASH_UNLOCK(dh);
742 1.1 dholland ufsdirhash_free(ip);
743 1.1 dholland return;
744 1.1 dholland }
745 1.1 dholland
746 1.1 dholland KASSERT(offset == dh->dh_dirblks * dirblksiz);
747 1.1 dholland block = offset / dirblksiz;
748 1.1 dholland if (block >= dh->dh_nblk) {
749 1.1 dholland /* Out of space; must rebuild. */
750 1.1 dholland DIRHASH_UNLOCK(dh);
751 1.1 dholland ufsdirhash_free(ip);
752 1.1 dholland return;
753 1.1 dholland }
754 1.1 dholland dh->dh_dirblks = block + 1;
755 1.1 dholland
756 1.1 dholland /* Account for the new free block. */
757 1.1 dholland dh->dh_blkfree[block] = dirblksiz / DIRALIGN;
758 1.1 dholland if (dh->dh_firstfree[DH_NFSTATS] == -1)
759 1.1 dholland dh->dh_firstfree[DH_NFSTATS] = block;
760 1.1 dholland DIRHASH_UNLOCK(dh);
761 1.1 dholland }
762 1.1 dholland
763 1.1 dholland /*
764 1.1 dholland * Inform dirhash that the directory is being truncated.
765 1.1 dholland */
766 1.1 dholland void
767 1.1 dholland ufsdirhash_dirtrunc(struct inode *ip, doff_t offset)
768 1.1 dholland {
769 1.1 dholland struct dirhash *dh;
770 1.1 dholland int block, i;
771 1.1 dholland int dirblksiz = ip->i_ump->um_dirblksiz;
772 1.1 dholland
773 1.1 dholland if ((dh = ip->i_dirhash) == NULL)
774 1.1 dholland return;
775 1.1 dholland
776 1.1 dholland DIRHASH_LOCK(dh);
777 1.1 dholland if (dh->dh_hash == NULL) {
778 1.1 dholland DIRHASH_UNLOCK(dh);
779 1.1 dholland ufsdirhash_free(ip);
780 1.1 dholland return;
781 1.1 dholland }
782 1.1 dholland
783 1.1 dholland KASSERT(offset <= dh->dh_dirblks * dirblksiz);
784 1.1 dholland block = howmany(offset, dirblksiz);
785 1.1 dholland /*
786 1.1 dholland * If the directory shrinks to less than 1/8 of dh_nblk blocks
787 1.1 dholland * (about 20% of its original size due to the 50% extra added in
788 1.1 dholland * ufsdirhash_build) then free it, and let the caller rebuild
789 1.1 dholland * if necessary.
790 1.1 dholland */
791 1.1 dholland if (block < dh->dh_nblk / 8 && dh->dh_narrays > 1) {
792 1.1 dholland DIRHASH_UNLOCK(dh);
793 1.1 dholland ufsdirhash_free(ip);
794 1.1 dholland return;
795 1.1 dholland }
796 1.1 dholland
797 1.1 dholland /*
798 1.1 dholland * Remove any `first free' information pertaining to the
799 1.1 dholland * truncated blocks. All blocks we're removing should be
800 1.1 dholland * completely unused.
801 1.1 dholland */
802 1.1 dholland if (dh->dh_firstfree[DH_NFSTATS] >= block)
803 1.1 dholland dh->dh_firstfree[DH_NFSTATS] = -1;
804 1.1 dholland for (i = block; i < dh->dh_dirblks; i++)
805 1.1 dholland if (dh->dh_blkfree[i] != dirblksiz / DIRALIGN)
806 1.1 dholland panic("ufsdirhash_dirtrunc: blocks in use");
807 1.1 dholland for (i = 0; i < DH_NFSTATS; i++)
808 1.1 dholland if (dh->dh_firstfree[i] >= block)
809 1.1 dholland panic("ufsdirhash_dirtrunc: first free corrupt");
810 1.1 dholland dh->dh_dirblks = block;
811 1.1 dholland DIRHASH_UNLOCK(dh);
812 1.1 dholland }
813 1.1 dholland
814 1.1 dholland /*
815 1.1 dholland * Debugging function to check that the dirhash information about
816 1.1 dholland * a directory block matches its actual contents. Panics if a mismatch
817 1.1 dholland * is detected.
818 1.1 dholland *
819 1.1 dholland * On entry, `sbuf' should point to the start of an in-core
820 1.1 dholland * DIRBLKSIZ-sized directory block, and `offset' should contain the
821 1.1 dholland * offset from the start of the directory of that block.
822 1.1 dholland */
823 1.1 dholland void
824 1.1 dholland ufsdirhash_checkblock(struct inode *ip, char *sbuf, doff_t offset)
825 1.1 dholland {
826 1.1 dholland struct dirhash *dh;
827 1.1 dholland struct direct *dp;
828 1.1 dholland int block, ffslot, i, nfree;
829 1.1 dholland const int needswap = UFS_MPNEEDSWAP(ip->i_ump);
830 1.1 dholland int dirblksiz = ip->i_ump->um_dirblksiz;
831 1.1 dholland
832 1.1 dholland if (!ufs_dirhashcheck)
833 1.1 dholland return;
834 1.1 dholland if ((dh = ip->i_dirhash) == NULL)
835 1.1 dholland return;
836 1.1 dholland
837 1.1 dholland DIRHASH_LOCK(dh);
838 1.1 dholland if (dh->dh_hash == NULL) {
839 1.1 dholland DIRHASH_UNLOCK(dh);
840 1.1 dholland ufsdirhash_free(ip);
841 1.1 dholland return;
842 1.1 dholland }
843 1.1 dholland
844 1.1 dholland block = offset / dirblksiz;
845 1.1 dholland if ((offset & (dirblksiz - 1)) != 0 || block >= dh->dh_dirblks)
846 1.1 dholland panic("ufsdirhash_checkblock: bad offset");
847 1.1 dholland
848 1.1 dholland nfree = 0;
849 1.1 dholland for (i = 0; i < dirblksiz; i += dp->d_reclen) {
850 1.1 dholland dp = (struct direct *)(sbuf + i);
851 1.1 dholland if (dp->d_reclen == 0 || i + dp->d_reclen > dirblksiz)
852 1.1 dholland panic("ufsdirhash_checkblock: bad dir");
853 1.1 dholland
854 1.1 dholland if (dp->d_ino == 0) {
855 1.1 dholland #if 0
856 1.1 dholland /*
857 1.1 dholland * XXX entries with d_ino == 0 should only occur
858 1.1 dholland * at the start of a DIRBLKSIZ block. However the
859 1.1 dholland * ufs code is tolerant of such entries at other
860 1.1 dholland * offsets, and fsck does not fix them.
861 1.1 dholland */
862 1.1 dholland if (i != 0)
863 1.1 dholland panic("ufsdirhash_checkblock: bad dir inode");
864 1.1 dholland #endif
865 1.1 dholland nfree += dp->d_reclen;
866 1.1 dholland continue;
867 1.1 dholland }
868 1.1 dholland
869 1.1 dholland /* Check that the entry exists (will panic if it doesn't). */
870 1.1 dholland ufsdirhash_findslot(dh, dp->d_name, dp->d_namlen, offset + i);
871 1.1 dholland
872 1.1 dholland nfree += dp->d_reclen - DIRSIZ(0, dp, needswap);
873 1.1 dholland }
874 1.1 dholland if (i != dirblksiz)
875 1.1 dholland panic("ufsdirhash_checkblock: bad dir end");
876 1.1 dholland
877 1.1 dholland if (dh->dh_blkfree[block] * DIRALIGN != nfree)
878 1.1 dholland panic("ufsdirhash_checkblock: bad free count");
879 1.1 dholland
880 1.1 dholland ffslot = BLKFREE2IDX(nfree / DIRALIGN);
881 1.1 dholland for (i = 0; i <= DH_NFSTATS; i++)
882 1.1 dholland if (dh->dh_firstfree[i] == block && i != ffslot)
883 1.1 dholland panic("ufsdirhash_checkblock: bad first-free");
884 1.1 dholland if (dh->dh_firstfree[ffslot] == -1)
885 1.1 dholland panic("ufsdirhash_checkblock: missing first-free entry");
886 1.1 dholland DIRHASH_UNLOCK(dh);
887 1.1 dholland }
888 1.1 dholland
889 1.1 dholland /*
890 1.1 dholland * Hash the specified filename into a dirhash slot.
891 1.1 dholland */
892 1.1 dholland static int
893 1.1 dholland ufsdirhash_hash(struct dirhash *dh, const char *name, int namelen)
894 1.1 dholland {
895 1.1 dholland u_int32_t hash;
896 1.1 dholland
897 1.1 dholland /*
898 1.1 dholland * We hash the name and then some other bit of data that is
899 1.1 dholland * invariant over the dirhash's lifetime. Otherwise names
900 1.1 dholland * differing only in the last byte are placed close to one
901 1.1 dholland * another in the table, which is bad for linear probing.
902 1.1 dholland */
903 1.1 dholland hash = hash32_buf(name, namelen, HASH32_BUF_INIT);
904 1.1 dholland hash = hash32_buf(&dh, sizeof(dh), hash);
905 1.1 dholland return (hash % dh->dh_hlen);
906 1.1 dholland }
907 1.1 dholland
908 1.1 dholland /*
909 1.1 dholland * Adjust the number of free bytes in the block containing `offset'
910 1.1 dholland * by the value specified by `diff'.
911 1.1 dholland *
912 1.1 dholland * The caller must ensure we have exclusive access to `dh'; normally
913 1.1 dholland * that means that dh_lock should be held, but this is also called
914 1.1 dholland * from ufsdirhash_build() where exclusive access can be assumed.
915 1.1 dholland */
916 1.1 dholland static void
917 1.1 dholland ufsdirhash_adjfree(struct dirhash *dh, doff_t offset, int diff, int dirblksiz)
918 1.1 dholland {
919 1.1 dholland int block, i, nfidx, ofidx;
920 1.1 dholland
921 1.1 dholland KASSERT(mutex_owned(&dh->dh_lock));
922 1.1 dholland
923 1.1 dholland /* Update the per-block summary info. */
924 1.1 dholland block = offset / dirblksiz;
925 1.1 dholland KASSERT(block < dh->dh_nblk && block < dh->dh_dirblks);
926 1.1 dholland ofidx = BLKFREE2IDX(dh->dh_blkfree[block]);
927 1.1 dholland dh->dh_blkfree[block] = (int)dh->dh_blkfree[block] + (diff / DIRALIGN);
928 1.1 dholland nfidx = BLKFREE2IDX(dh->dh_blkfree[block]);
929 1.1 dholland
930 1.1 dholland /* Update the `first free' list if necessary. */
931 1.1 dholland if (ofidx != nfidx) {
932 1.1 dholland /* If removing, scan forward for the next block. */
933 1.1 dholland if (dh->dh_firstfree[ofidx] == block) {
934 1.1 dholland for (i = block + 1; i < dh->dh_dirblks; i++)
935 1.1 dholland if (BLKFREE2IDX(dh->dh_blkfree[i]) == ofidx)
936 1.1 dholland break;
937 1.1 dholland dh->dh_firstfree[ofidx] = (i < dh->dh_dirblks) ? i : -1;
938 1.1 dholland }
939 1.1 dholland
940 1.1 dholland /* Make this the new `first free' if necessary */
941 1.1 dholland if (dh->dh_firstfree[nfidx] > block ||
942 1.1 dholland dh->dh_firstfree[nfidx] == -1)
943 1.1 dholland dh->dh_firstfree[nfidx] = block;
944 1.1 dholland }
945 1.1 dholland }
946 1.1 dholland
947 1.1 dholland /*
948 1.1 dholland * Find the specified name which should have the specified offset.
949 1.1 dholland * Returns a slot number, and panics on failure.
950 1.1 dholland *
951 1.1 dholland * `dh' must be locked on entry and remains so on return.
952 1.1 dholland */
953 1.1 dholland static int
954 1.1 dholland ufsdirhash_findslot(struct dirhash *dh, const char *name, int namelen,
955 1.1 dholland doff_t offset)
956 1.1 dholland {
957 1.1 dholland int slot;
958 1.1 dholland
959 1.1 dholland KASSERT(mutex_owned(&dh->dh_lock));
960 1.1 dholland
961 1.1 dholland /* Find the entry. */
962 1.1 dholland KASSERT(dh->dh_hused < dh->dh_hlen);
963 1.1 dholland slot = ufsdirhash_hash(dh, name, namelen);
964 1.1 dholland while (DH_ENTRY(dh, slot) != offset &&
965 1.1 dholland DH_ENTRY(dh, slot) != DIRHASH_EMPTY)
966 1.1 dholland slot = WRAPINCR(slot, dh->dh_hlen);
967 1.1 dholland if (DH_ENTRY(dh, slot) != offset)
968 1.1 dholland panic("ufsdirhash_findslot: '%.*s' not found", namelen, name);
969 1.1 dholland
970 1.1 dholland return (slot);
971 1.1 dholland }
972 1.1 dholland
973 1.1 dholland /*
974 1.1 dholland * Remove the entry corresponding to the specified slot from the hash array.
975 1.1 dholland *
976 1.1 dholland * `dh' must be locked on entry and remains so on return.
977 1.1 dholland */
978 1.1 dholland static void
979 1.1 dholland ufsdirhash_delslot(struct dirhash *dh, int slot)
980 1.1 dholland {
981 1.1 dholland int i;
982 1.1 dholland
983 1.1 dholland KASSERT(mutex_owned(&dh->dh_lock));
984 1.1 dholland
985 1.1 dholland /* Mark the entry as deleted. */
986 1.1 dholland DH_ENTRY(dh, slot) = DIRHASH_DEL;
987 1.1 dholland
988 1.1 dholland /* If this is the end of a chain of DIRHASH_DEL slots, remove them. */
989 1.1 dholland for (i = slot; DH_ENTRY(dh, i) == DIRHASH_DEL; )
990 1.1 dholland i = WRAPINCR(i, dh->dh_hlen);
991 1.1 dholland if (DH_ENTRY(dh, i) == DIRHASH_EMPTY) {
992 1.1 dholland i = WRAPDECR(i, dh->dh_hlen);
993 1.1 dholland while (DH_ENTRY(dh, i) == DIRHASH_DEL) {
994 1.1 dholland DH_ENTRY(dh, i) = DIRHASH_EMPTY;
995 1.1 dholland dh->dh_hused--;
996 1.1 dholland i = WRAPDECR(i, dh->dh_hlen);
997 1.1 dholland }
998 1.1 dholland KASSERT(dh->dh_hused >= 0);
999 1.1 dholland }
1000 1.1 dholland }
1001 1.1 dholland
1002 1.1 dholland /*
1003 1.1 dholland * Given a directory entry and its offset, find the offset of the
1004 1.1 dholland * previous entry in the same DIRBLKSIZ-sized block. Returns an
1005 1.1 dholland * offset, or -1 if there is no previous entry in the block or some
1006 1.1 dholland * other problem occurred.
1007 1.1 dholland */
1008 1.1 dholland static doff_t
1009 1.1 dholland ufsdirhash_getprev(struct direct *dirp, doff_t offset, int dirblksiz)
1010 1.1 dholland {
1011 1.1 dholland struct direct *dp;
1012 1.1 dholland char *blkbuf;
1013 1.1 dholland doff_t blkoff, prevoff;
1014 1.1 dholland int entrypos, i;
1015 1.1 dholland
1016 1.1 dholland blkoff = offset & ~(dirblksiz - 1); /* offset of start of block */
1017 1.1 dholland entrypos = offset & (dirblksiz - 1); /* entry relative to block */
1018 1.1 dholland blkbuf = (char *)dirp - entrypos;
1019 1.1 dholland prevoff = blkoff;
1020 1.1 dholland
1021 1.1 dholland /* If `offset' is the start of a block, there is no previous entry. */
1022 1.1 dholland if (entrypos == 0)
1023 1.1 dholland return (-1);
1024 1.1 dholland
1025 1.1 dholland /* Scan from the start of the block until we get to the entry. */
1026 1.1 dholland for (i = 0; i < entrypos; i += dp->d_reclen) {
1027 1.1 dholland dp = (struct direct *)(blkbuf + i);
1028 1.1 dholland if (dp->d_reclen == 0 || i + dp->d_reclen > entrypos)
1029 1.1 dholland return (-1); /* Corrupted directory. */
1030 1.1 dholland prevoff = blkoff + i;
1031 1.1 dholland }
1032 1.1 dholland return (prevoff);
1033 1.1 dholland }
1034 1.1 dholland
1035 1.1 dholland /*
1036 1.1 dholland * Try to free up `wanted' bytes by stealing memory from existing
1037 1.1 dholland * dirhashes. Returns zero with list locked if successful.
1038 1.1 dholland */
1039 1.1 dholland static int
1040 1.1 dholland ufsdirhash_recycle(int wanted)
1041 1.1 dholland {
1042 1.1 dholland struct dirhash *dh;
1043 1.1 dholland doff_t **hash;
1044 1.1 dholland u_int8_t *blkfree;
1045 1.1 dholland int i, mem, narrays;
1046 1.1 dholland size_t hashsz, blkfreesz;
1047 1.1 dholland
1048 1.1 dholland DIRHASHLIST_LOCK();
1049 1.1 dholland while (wanted + ufs_dirhashmem > ufs_dirhashmaxmem) {
1050 1.1 dholland /* Find a dirhash, and lock it. */
1051 1.1 dholland if ((dh = TAILQ_FIRST(&ufsdirhash_list)) == NULL) {
1052 1.1 dholland DIRHASHLIST_UNLOCK();
1053 1.1 dholland return (-1);
1054 1.1 dholland }
1055 1.1 dholland DIRHASH_LOCK(dh);
1056 1.1 dholland KASSERT(dh->dh_hash != NULL);
1057 1.1 dholland
1058 1.1 dholland /* Decrement the score; only recycle if it becomes zero. */
1059 1.1 dholland if (--dh->dh_score > 0) {
1060 1.1 dholland DIRHASH_UNLOCK(dh);
1061 1.1 dholland DIRHASHLIST_UNLOCK();
1062 1.1 dholland return (-1);
1063 1.1 dholland }
1064 1.1 dholland
1065 1.1 dholland /* Remove it from the list and detach its memory. */
1066 1.1 dholland TAILQ_REMOVE(&ufsdirhash_list, dh, dh_list);
1067 1.1 dholland dh->dh_onlist = 0;
1068 1.1 dholland hash = dh->dh_hash;
1069 1.1 dholland hashsz = dh->dh_hashsz;
1070 1.1 dholland dh->dh_hash = NULL;
1071 1.1 dholland blkfree = dh->dh_blkfree;
1072 1.1 dholland blkfreesz = dh->dh_blkfreesz;
1073 1.1 dholland dh->dh_blkfree = NULL;
1074 1.1 dholland narrays = dh->dh_narrays;
1075 1.1 dholland mem = narrays * sizeof(*dh->dh_hash) +
1076 1.1 dholland narrays * DH_NBLKOFF * sizeof(**dh->dh_hash) +
1077 1.1 dholland dh->dh_nblk * sizeof(*dh->dh_blkfree);
1078 1.1 dholland
1079 1.1 dholland /* Unlock everything, free the detached memory. */
1080 1.1 dholland DIRHASH_UNLOCK(dh);
1081 1.1 dholland DIRHASHLIST_UNLOCK();
1082 1.1 dholland
1083 1.1 dholland for (i = 0; i < narrays; i++)
1084 1.1 dholland DIRHASH_BLKFREE(hash[i]);
1085 1.1 dholland kmem_free(hash, hashsz);
1086 1.1 dholland kmem_free(blkfree, blkfreesz);
1087 1.1 dholland
1088 1.1 dholland /* Account for the returned memory, and repeat if necessary. */
1089 1.1 dholland DIRHASHLIST_LOCK();
1090 1.1 dholland atomic_add_int(&ufs_dirhashmem, -mem);
1091 1.1 dholland }
1092 1.1 dholland /* Success. */
1093 1.1 dholland return (0);
1094 1.1 dholland }
1095 1.1 dholland
1096 1.1 dholland static void
1097 1.1 dholland ufsdirhash_sysctl_init(void)
1098 1.1 dholland {
1099 1.1 dholland const struct sysctlnode *rnode, *cnode;
1100 1.1 dholland
1101 1.1 dholland sysctl_createv(&ufsdirhash_sysctl_log, 0, NULL, &rnode,
1102 1.1 dholland CTLFLAG_PERMANENT,
1103 1.1 dholland CTLTYPE_NODE, "vfs", NULL,
1104 1.1 dholland NULL, 0, NULL, 0,
1105 1.1 dholland CTL_VFS, CTL_EOL);
1106 1.1 dholland
1107 1.1 dholland sysctl_createv(&ufsdirhash_sysctl_log, 0, &rnode, &rnode,
1108 1.1 dholland CTLFLAG_PERMANENT,
1109 1.1 dholland CTLTYPE_NODE, "ufs",
1110 1.1 dholland SYSCTL_DESCR("ufs"),
1111 1.1 dholland NULL, 0, NULL, 0,
1112 1.1 dholland CTL_CREATE, CTL_EOL);
1113 1.1 dholland
1114 1.1 dholland sysctl_createv(&ufsdirhash_sysctl_log, 0, &rnode, &rnode,
1115 1.1 dholland CTLFLAG_PERMANENT,
1116 1.1 dholland CTLTYPE_NODE, "dirhash",
1117 1.1 dholland SYSCTL_DESCR("dirhash"),
1118 1.1 dholland NULL, 0, NULL, 0,
1119 1.1 dholland CTL_CREATE, CTL_EOL);
1120 1.1 dholland
1121 1.1 dholland sysctl_createv(&ufsdirhash_sysctl_log, 0, &rnode, &cnode,
1122 1.1 dholland CTLFLAG_PERMANENT|CTLFLAG_READWRITE,
1123 1.1 dholland CTLTYPE_INT, "minblocks",
1124 1.1 dholland SYSCTL_DESCR("minimum hashed directory size in blocks"),
1125 1.1 dholland NULL, 0, &ufs_dirhashminblks, 0,
1126 1.1 dholland CTL_CREATE, CTL_EOL);
1127 1.1 dholland
1128 1.1 dholland sysctl_createv(&ufsdirhash_sysctl_log, 0, &rnode, &cnode,
1129 1.1 dholland CTLFLAG_PERMANENT|CTLFLAG_READWRITE,
1130 1.1 dholland CTLTYPE_INT, "maxmem",
1131 1.1 dholland SYSCTL_DESCR("maximum dirhash memory usage"),
1132 1.1 dholland NULL, 0, &ufs_dirhashmaxmem, 0,
1133 1.1 dholland CTL_CREATE, CTL_EOL);
1134 1.1 dholland
1135 1.1 dholland sysctl_createv(&ufsdirhash_sysctl_log, 0, &rnode, &cnode,
1136 1.1 dholland CTLFLAG_PERMANENT|CTLFLAG_READONLY,
1137 1.1 dholland CTLTYPE_INT, "memused",
1138 1.1 dholland SYSCTL_DESCR("current dirhash memory usage"),
1139 1.1 dholland NULL, 0, &ufs_dirhashmem, 0,
1140 1.1 dholland CTL_CREATE, CTL_EOL);
1141 1.1 dholland
1142 1.1 dholland sysctl_createv(&ufsdirhash_sysctl_log, 0, &rnode, &cnode,
1143 1.1 dholland CTLFLAG_PERMANENT|CTLFLAG_READWRITE,
1144 1.1 dholland CTLTYPE_INT, "docheck",
1145 1.1 dholland SYSCTL_DESCR("enable extra sanity checks"),
1146 1.1 dholland NULL, 0, &ufs_dirhashcheck, 0,
1147 1.1 dholland CTL_CREATE, CTL_EOL);
1148 1.1 dholland }
1149 1.1 dholland
1150 1.1 dholland void
1151 1.1 dholland ufsdirhash_init(void)
1152 1.1 dholland {
1153 1.1 dholland
1154 1.1 dholland mutex_init(&ufsdirhash_lock, MUTEX_DEFAULT, IPL_NONE);
1155 1.1 dholland ufsdirhashblk_cache = pool_cache_init(DH_NBLKOFF * sizeof(daddr_t), 0,
1156 1.1 dholland 0, 0, "dirhashblk", NULL, IPL_NONE, NULL, NULL, NULL);
1157 1.1 dholland ufsdirhash_cache = pool_cache_init(sizeof(struct dirhash), 0,
1158 1.1 dholland 0, 0, "dirhash", NULL, IPL_NONE, NULL, NULL, NULL);
1159 1.1 dholland TAILQ_INIT(&ufsdirhash_list);
1160 1.1 dholland ufsdirhash_sysctl_init();
1161 1.1 dholland }
1162 1.1 dholland
1163 1.1 dholland void
1164 1.1 dholland ufsdirhash_done(void)
1165 1.1 dholland {
1166 1.1 dholland
1167 1.1 dholland KASSERT(TAILQ_EMPTY(&ufsdirhash_list));
1168 1.1 dholland pool_cache_destroy(ufsdirhashblk_cache);
1169 1.1 dholland pool_cache_destroy(ufsdirhash_cache);
1170 1.1 dholland mutex_destroy(&ufsdirhash_lock);
1171 1.1 dholland sysctl_teardown(&ufsdirhash_sysctl_log);
1172 1.1 dholland }
1173