ulfs_dirhash.c revision 1.17 1 1.17 dholland /* $NetBSD: ulfs_dirhash.c,v 1.17 2016/06/20 01:53:38 dholland Exp $ */
2 1.17 dholland /* from NetBSD: ufs_dirhash.c,v 1.37 2014/12/20 00:28:05 christos Exp */
3 1.1 dholland
4 1.1 dholland /*
5 1.1 dholland * Copyright (c) 2001, 2002 Ian Dowse. All rights reserved.
6 1.1 dholland *
7 1.1 dholland * Redistribution and use in source and binary forms, with or without
8 1.1 dholland * modification, are permitted provided that the following conditions
9 1.1 dholland * are met:
10 1.1 dholland * 1. Redistributions of source code must retain the above copyright
11 1.1 dholland * notice, this list of conditions and the following disclaimer.
12 1.1 dholland * 2. Redistributions in binary form must reproduce the above copyright
13 1.1 dholland * notice, this list of conditions and the following disclaimer in the
14 1.1 dholland * documentation and/or other materials provided with the distribution.
15 1.1 dholland *
16 1.1 dholland * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
17 1.1 dholland * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
18 1.1 dholland * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
19 1.1 dholland * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
20 1.1 dholland * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
21 1.1 dholland * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
22 1.1 dholland * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
23 1.1 dholland * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
24 1.1 dholland * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
25 1.1 dholland * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
26 1.1 dholland * SUCH DAMAGE.
27 1.1 dholland *
28 1.1 dholland * $FreeBSD: src/sys/ufs/ufs/ufs_dirhash.c,v 1.3.2.8 2004/12/08 11:54:13 dwmalone Exp $
29 1.1 dholland */
30 1.1 dholland
31 1.1 dholland #include <sys/cdefs.h>
32 1.17 dholland __KERNEL_RCSID(0, "$NetBSD: ulfs_dirhash.c,v 1.17 2016/06/20 01:53:38 dholland Exp $");
33 1.1 dholland
34 1.1 dholland /*
35 1.3 dholland * This implements a hash-based lookup scheme for ULFS directories.
36 1.1 dholland */
37 1.1 dholland
38 1.1 dholland #include <sys/param.h>
39 1.1 dholland #include <sys/systm.h>
40 1.1 dholland #include <sys/kernel.h>
41 1.1 dholland #include <sys/kmem.h>
42 1.1 dholland #include <sys/types.h>
43 1.1 dholland #include <sys/hash.h>
44 1.1 dholland #include <sys/proc.h>
45 1.1 dholland #include <sys/buf.h>
46 1.1 dholland #include <sys/vnode.h>
47 1.1 dholland #include <sys/mount.h>
48 1.1 dholland #include <sys/pool.h>
49 1.1 dholland #include <sys/sysctl.h>
50 1.1 dholland #include <sys/atomic.h>
51 1.1 dholland
52 1.9 dholland #include <ufs/lfs/lfs.h>
53 1.9 dholland #include <ufs/lfs/lfs_accessors.h>
54 1.2 dholland #include <ufs/lfs/ulfs_inode.h>
55 1.2 dholland #include <ufs/lfs/ulfs_dirhash.h>
56 1.2 dholland #include <ufs/lfs/ulfsmount.h>
57 1.2 dholland #include <ufs/lfs/ulfs_bswap.h>
58 1.2 dholland #include <ufs/lfs/ulfs_extern.h>
59 1.1 dholland
60 1.1 dholland #define WRAPINCR(val, limit) (((val) + 1 == (limit)) ? 0 : ((val) + 1))
61 1.1 dholland #define WRAPDECR(val, limit) (((val) == 0) ? ((limit) - 1) : ((val) - 1))
62 1.7 dholland #define OFSFMT(ip) ((ip)->i_lfs->um_maxsymlinklen <= 0)
63 1.1 dholland #define BLKFREE2IDX(n) ((n) > DH_NFSTATS ? DH_NFSTATS : (n))
64 1.1 dholland
65 1.3 dholland static u_int ulfs_dirhashminblks = 5;
66 1.3 dholland static u_int ulfs_dirhashmaxmem = 2 * 1024 * 1024;
67 1.3 dholland static u_int ulfs_dirhashmem;
68 1.3 dholland static u_int ulfs_dirhashcheck = 0;
69 1.1 dholland
70 1.3 dholland static int ulfsdirhash_hash(struct dirhash *dh, const char *name, int namelen);
71 1.3 dholland static void ulfsdirhash_adjfree(struct dirhash *dh, doff_t offset, int diff,
72 1.1 dholland int dirblksiz);
73 1.3 dholland static void ulfsdirhash_delslot(struct dirhash *dh, int slot);
74 1.3 dholland static int ulfsdirhash_findslot(struct dirhash *dh, const char *name,
75 1.1 dholland int namelen, doff_t offset);
76 1.14 dholland static doff_t ulfsdirhash_getprev(struct lfs *fs, LFS_DIRHEADER *dp,
77 1.10 dholland doff_t offset, int dirblksiz);
78 1.3 dholland static int ulfsdirhash_recycle(int wanted);
79 1.1 dholland
80 1.3 dholland static pool_cache_t ulfsdirhashblk_cache;
81 1.3 dholland static pool_cache_t ulfsdirhash_cache;
82 1.1 dholland
83 1.3 dholland #define DIRHASHLIST_LOCK() mutex_enter(&ulfsdirhash_lock)
84 1.3 dholland #define DIRHASHLIST_UNLOCK() mutex_exit(&ulfsdirhash_lock)
85 1.1 dholland #define DIRHASH_LOCK(dh) mutex_enter(&(dh)->dh_lock)
86 1.1 dholland #define DIRHASH_UNLOCK(dh) mutex_exit(&(dh)->dh_lock)
87 1.1 dholland #define DIRHASH_BLKALLOC() \
88 1.3 dholland pool_cache_get(ulfsdirhashblk_cache, PR_NOWAIT)
89 1.1 dholland #define DIRHASH_BLKFREE(ptr) \
90 1.3 dholland pool_cache_put(ulfsdirhashblk_cache, ptr)
91 1.1 dholland
92 1.1 dholland /* Dirhash list; recently-used entries are near the tail. */
93 1.3 dholland static TAILQ_HEAD(, dirhash) ulfsdirhash_list;
94 1.1 dholland
95 1.3 dholland /* Protects: ulfsdirhash_list, `dh_list' field, ulfs_dirhashmem. */
96 1.3 dholland static kmutex_t ulfsdirhash_lock;
97 1.1 dholland
98 1.3 dholland static struct sysctllog *ulfsdirhash_sysctl_log;
99 1.1 dholland
100 1.1 dholland /*
101 1.1 dholland * Locking order:
102 1.3 dholland * ulfsdirhash_lock
103 1.1 dholland * dh_lock
104 1.1 dholland *
105 1.1 dholland * The dh_lock mutex should be acquired either via the inode lock, or via
106 1.3 dholland * ulfsdirhash_lock. Only the owner of the inode may free the associated
107 1.1 dholland * dirhash, but anything can steal its memory and set dh_hash to NULL.
108 1.1 dholland */
109 1.1 dholland
110 1.1 dholland /*
111 1.1 dholland * Attempt to build up a hash table for the directory contents in
112 1.1 dholland * inode 'ip'. Returns 0 on success, or -1 of the operation failed.
113 1.1 dholland */
114 1.1 dholland int
115 1.3 dholland ulfsdirhash_build(struct inode *ip)
116 1.1 dholland {
117 1.9 dholland struct lfs *fs = ip->i_lfs;
118 1.1 dholland struct dirhash *dh;
119 1.1 dholland struct buf *bp = NULL;
120 1.14 dholland LFS_DIRHEADER *ep;
121 1.1 dholland struct vnode *vp;
122 1.1 dholland doff_t bmask, pos;
123 1.1 dholland int dirblocks, i, j, memreqd, nblocks, narrays, nslots, slot;
124 1.7 dholland int dirblksiz = ip->i_lfs->um_dirblksiz;
125 1.1 dholland
126 1.1 dholland /* Check if we can/should use dirhash. */
127 1.1 dholland if (ip->i_dirhash == NULL) {
128 1.3 dholland if (ip->i_size < (ulfs_dirhashminblks * dirblksiz) || OFSFMT(ip))
129 1.1 dholland return (-1);
130 1.1 dholland } else {
131 1.1 dholland /* Hash exists, but sysctls could have changed. */
132 1.3 dholland if (ip->i_size < (ulfs_dirhashminblks * dirblksiz) ||
133 1.3 dholland ulfs_dirhashmem > ulfs_dirhashmaxmem) {
134 1.3 dholland ulfsdirhash_free(ip);
135 1.1 dholland return (-1);
136 1.1 dholland }
137 1.1 dholland /* Check if hash exists and is intact (note: unlocked read). */
138 1.1 dholland if (ip->i_dirhash->dh_hash != NULL)
139 1.1 dholland return (0);
140 1.1 dholland /* Free the old, recycled hash and build a new one. */
141 1.3 dholland ulfsdirhash_free(ip);
142 1.1 dholland }
143 1.1 dholland
144 1.1 dholland /* Don't hash removed directories. */
145 1.1 dholland if (ip->i_nlink == 0)
146 1.1 dholland return (-1);
147 1.1 dholland
148 1.1 dholland vp = ip->i_vnode;
149 1.1 dholland /* Allocate 50% more entries than this dir size could ever need. */
150 1.1 dholland KASSERT(ip->i_size >= dirblksiz);
151 1.13 dholland nslots = ip->i_size / LFS_DIRECTSIZ(fs, 1);
152 1.1 dholland nslots = (nslots * 3 + 1) / 2;
153 1.1 dholland narrays = howmany(nslots, DH_NBLKOFF);
154 1.1 dholland nslots = narrays * DH_NBLKOFF;
155 1.1 dholland dirblocks = howmany(ip->i_size, dirblksiz);
156 1.1 dholland nblocks = (dirblocks * 3 + 1) / 2;
157 1.1 dholland
158 1.1 dholland memreqd = sizeof(*dh) + narrays * sizeof(*dh->dh_hash) +
159 1.1 dholland narrays * DH_NBLKOFF * sizeof(**dh->dh_hash) +
160 1.1 dholland nblocks * sizeof(*dh->dh_blkfree);
161 1.1 dholland
162 1.3 dholland while (atomic_add_int_nv(&ulfs_dirhashmem, memreqd) >
163 1.3 dholland ulfs_dirhashmaxmem) {
164 1.3 dholland atomic_add_int(&ulfs_dirhashmem, -memreqd);
165 1.3 dholland if (memreqd > ulfs_dirhashmaxmem / 2)
166 1.1 dholland return (-1);
167 1.1 dholland /* Try to free some space. */
168 1.3 dholland if (ulfsdirhash_recycle(memreqd) != 0)
169 1.1 dholland return (-1);
170 1.1 dholland else
171 1.1 dholland DIRHASHLIST_UNLOCK();
172 1.1 dholland }
173 1.1 dholland
174 1.1 dholland /*
175 1.1 dholland * Use non-blocking mallocs so that we will revert to a linear
176 1.1 dholland * lookup on failure rather than potentially blocking forever.
177 1.1 dholland */
178 1.3 dholland dh = pool_cache_get(ulfsdirhash_cache, PR_NOWAIT);
179 1.1 dholland if (dh == NULL) {
180 1.3 dholland atomic_add_int(&ulfs_dirhashmem, -memreqd);
181 1.1 dholland return (-1);
182 1.1 dholland }
183 1.1 dholland memset(dh, 0, sizeof(*dh));
184 1.1 dholland mutex_init(&dh->dh_lock, MUTEX_DEFAULT, IPL_NONE);
185 1.1 dholland DIRHASH_LOCK(dh);
186 1.1 dholland dh->dh_hashsz = narrays * sizeof(dh->dh_hash[0]);
187 1.1 dholland dh->dh_hash = kmem_zalloc(dh->dh_hashsz, KM_NOSLEEP);
188 1.1 dholland dh->dh_blkfreesz = nblocks * sizeof(dh->dh_blkfree[0]);
189 1.1 dholland dh->dh_blkfree = kmem_zalloc(dh->dh_blkfreesz, KM_NOSLEEP);
190 1.1 dholland if (dh->dh_hash == NULL || dh->dh_blkfree == NULL)
191 1.1 dholland goto fail;
192 1.1 dholland for (i = 0; i < narrays; i++) {
193 1.1 dholland if ((dh->dh_hash[i] = DIRHASH_BLKALLOC()) == NULL)
194 1.1 dholland goto fail;
195 1.1 dholland for (j = 0; j < DH_NBLKOFF; j++)
196 1.1 dholland dh->dh_hash[i][j] = DIRHASH_EMPTY;
197 1.1 dholland }
198 1.1 dholland
199 1.1 dholland /* Initialise the hash table and block statistics. */
200 1.1 dholland dh->dh_narrays = narrays;
201 1.1 dholland dh->dh_hlen = nslots;
202 1.1 dholland dh->dh_nblk = nblocks;
203 1.1 dholland dh->dh_dirblks = dirblocks;
204 1.1 dholland for (i = 0; i < dirblocks; i++)
205 1.1 dholland dh->dh_blkfree[i] = dirblksiz / DIRALIGN;
206 1.1 dholland for (i = 0; i < DH_NFSTATS; i++)
207 1.1 dholland dh->dh_firstfree[i] = -1;
208 1.1 dholland dh->dh_firstfree[DH_NFSTATS] = 0;
209 1.1 dholland dh->dh_seqopt = 0;
210 1.1 dholland dh->dh_seqoff = 0;
211 1.1 dholland dh->dh_score = DH_SCOREINIT;
212 1.1 dholland ip->i_dirhash = dh;
213 1.1 dholland
214 1.3 dholland bmask = VFSTOULFS(vp->v_mount)->um_mountp->mnt_stat.f_iosize - 1;
215 1.1 dholland pos = 0;
216 1.1 dholland while (pos < ip->i_size) {
217 1.1 dholland if ((curcpu()->ci_schedstate.spc_flags & SPCF_SHOULDYIELD)
218 1.1 dholland != 0) {
219 1.1 dholland preempt();
220 1.1 dholland }
221 1.1 dholland /* If necessary, get the next directory block. */
222 1.1 dholland if ((pos & bmask) == 0) {
223 1.1 dholland if (bp != NULL)
224 1.1 dholland brelse(bp, 0);
225 1.3 dholland if (ulfs_blkatoff(vp, (off_t)pos, NULL, &bp, false) != 0)
226 1.1 dholland goto fail;
227 1.1 dholland }
228 1.1 dholland
229 1.1 dholland /* Add this entry to the hash. */
230 1.14 dholland ep = (LFS_DIRHEADER *)((char *)bp->b_data + (pos & bmask));
231 1.10 dholland if (lfs_dir_getreclen(fs, ep) == 0 || lfs_dir_getreclen(fs, ep) >
232 1.1 dholland dirblksiz - (pos & (dirblksiz - 1))) {
233 1.1 dholland /* Corrupted directory. */
234 1.1 dholland brelse(bp, 0);
235 1.1 dholland goto fail;
236 1.1 dholland }
237 1.10 dholland if (lfs_dir_getino(fs, ep) != 0) {
238 1.3 dholland /* Add the entry (simplified ulfsdirhash_add). */
239 1.11 dholland slot = ulfsdirhash_hash(dh, lfs_dir_nameptr(fs, ep),
240 1.9 dholland lfs_dir_getnamlen(fs, ep));
241 1.1 dholland while (DH_ENTRY(dh, slot) != DIRHASH_EMPTY)
242 1.1 dholland slot = WRAPINCR(slot, dh->dh_hlen);
243 1.1 dholland dh->dh_hused++;
244 1.1 dholland DH_ENTRY(dh, slot) = pos;
245 1.9 dholland ulfsdirhash_adjfree(dh, pos, -LFS_DIRSIZ(fs, ep),
246 1.1 dholland dirblksiz);
247 1.1 dholland }
248 1.10 dholland pos += lfs_dir_getreclen(fs, ep);
249 1.1 dholland }
250 1.1 dholland
251 1.1 dholland if (bp != NULL)
252 1.1 dholland brelse(bp, 0);
253 1.1 dholland DIRHASHLIST_LOCK();
254 1.3 dholland TAILQ_INSERT_TAIL(&ulfsdirhash_list, dh, dh_list);
255 1.1 dholland dh->dh_onlist = 1;
256 1.1 dholland DIRHASH_UNLOCK(dh);
257 1.1 dholland DIRHASHLIST_UNLOCK();
258 1.1 dholland return (0);
259 1.1 dholland
260 1.1 dholland fail:
261 1.17 dholland ip->i_dirhash = NULL;
262 1.1 dholland DIRHASH_UNLOCK(dh);
263 1.1 dholland if (dh->dh_hash != NULL) {
264 1.1 dholland for (i = 0; i < narrays; i++)
265 1.1 dholland if (dh->dh_hash[i] != NULL)
266 1.1 dholland DIRHASH_BLKFREE(dh->dh_hash[i]);
267 1.1 dholland kmem_free(dh->dh_hash, dh->dh_hashsz);
268 1.1 dholland }
269 1.1 dholland if (dh->dh_blkfree != NULL)
270 1.1 dholland kmem_free(dh->dh_blkfree, dh->dh_blkfreesz);
271 1.1 dholland mutex_destroy(&dh->dh_lock);
272 1.3 dholland pool_cache_put(ulfsdirhash_cache, dh);
273 1.3 dholland atomic_add_int(&ulfs_dirhashmem, -memreqd);
274 1.1 dholland return (-1);
275 1.1 dholland }
276 1.1 dholland
277 1.1 dholland /*
278 1.1 dholland * Free any hash table associated with inode 'ip'.
279 1.1 dholland */
280 1.1 dholland void
281 1.3 dholland ulfsdirhash_free(struct inode *ip)
282 1.1 dholland {
283 1.1 dholland struct dirhash *dh;
284 1.1 dholland int i, mem;
285 1.1 dholland
286 1.1 dholland if ((dh = ip->i_dirhash) == NULL)
287 1.1 dholland return;
288 1.1 dholland
289 1.17 dholland ip->i_dirhash = NULL;
290 1.17 dholland
291 1.1 dholland if (dh->dh_onlist) {
292 1.1 dholland DIRHASHLIST_LOCK();
293 1.1 dholland if (dh->dh_onlist)
294 1.3 dholland TAILQ_REMOVE(&ulfsdirhash_list, dh, dh_list);
295 1.1 dholland DIRHASHLIST_UNLOCK();
296 1.1 dholland }
297 1.1 dholland
298 1.1 dholland /* The dirhash pointed to by 'dh' is exclusively ours now. */
299 1.1 dholland mem = sizeof(*dh);
300 1.1 dholland if (dh->dh_hash != NULL) {
301 1.1 dholland for (i = 0; i < dh->dh_narrays; i++)
302 1.1 dholland DIRHASH_BLKFREE(dh->dh_hash[i]);
303 1.1 dholland kmem_free(dh->dh_hash, dh->dh_hashsz);
304 1.1 dholland kmem_free(dh->dh_blkfree, dh->dh_blkfreesz);
305 1.1 dholland mem += dh->dh_hashsz;
306 1.1 dholland mem += dh->dh_narrays * DH_NBLKOFF * sizeof(**dh->dh_hash);
307 1.1 dholland mem += dh->dh_nblk * sizeof(*dh->dh_blkfree);
308 1.1 dholland }
309 1.1 dholland mutex_destroy(&dh->dh_lock);
310 1.3 dholland pool_cache_put(ulfsdirhash_cache, dh);
311 1.1 dholland
312 1.3 dholland atomic_add_int(&ulfs_dirhashmem, -mem);
313 1.1 dholland }
314 1.1 dholland
315 1.1 dholland /*
316 1.1 dholland * Find the offset of the specified name within the given inode.
317 1.1 dholland * Returns 0 on success, ENOENT if the entry does not exist, or
318 1.1 dholland * EJUSTRETURN if the caller should revert to a linear search.
319 1.1 dholland *
320 1.1 dholland * If successful, the directory offset is stored in *offp, and a
321 1.1 dholland * pointer to a struct buf containing the entry is stored in *bpp. If
322 1.1 dholland * prevoffp is non-NULL, the offset of the previous entry within
323 1.1 dholland * the DIRBLKSIZ-sized block is stored in *prevoffp (if the entry
324 1.1 dholland * is the first in a block, the start of the block is used).
325 1.1 dholland */
326 1.1 dholland int
327 1.3 dholland ulfsdirhash_lookup(struct inode *ip, const char *name, int namelen, doff_t *offp,
328 1.1 dholland struct buf **bpp, doff_t *prevoffp)
329 1.1 dholland {
330 1.9 dholland struct lfs *fs = ip->i_lfs;
331 1.1 dholland struct dirhash *dh, *dh_next;
332 1.14 dholland LFS_DIRHEADER *dp;
333 1.1 dholland struct vnode *vp;
334 1.1 dholland struct buf *bp;
335 1.1 dholland doff_t blkoff, bmask, offset, prevoff;
336 1.1 dholland int i, slot;
337 1.7 dholland int dirblksiz = ip->i_lfs->um_dirblksiz;
338 1.1 dholland
339 1.1 dholland if ((dh = ip->i_dirhash) == NULL)
340 1.1 dholland return (EJUSTRETURN);
341 1.1 dholland
342 1.1 dholland /*
343 1.1 dholland * Move this dirhash towards the end of the list if it has a
344 1.1 dholland * score higher than the next entry, and acquire the dh_lock.
345 1.1 dholland * Optimise the case where it's already the last by performing
346 1.1 dholland * an unlocked read of the TAILQ_NEXT pointer.
347 1.1 dholland *
348 1.1 dholland * In both cases, end up holding just dh_lock.
349 1.1 dholland */
350 1.1 dholland if (TAILQ_NEXT(dh, dh_list) != NULL) {
351 1.1 dholland DIRHASHLIST_LOCK();
352 1.1 dholland DIRHASH_LOCK(dh);
353 1.1 dholland /*
354 1.1 dholland * If the new score will be greater than that of the next
355 1.1 dholland * entry, then move this entry past it. With both mutexes
356 1.1 dholland * held, dh_next won't go away, but its dh_score could
357 1.1 dholland * change; that's not important since it is just a hint.
358 1.1 dholland */
359 1.1 dholland if (dh->dh_hash != NULL &&
360 1.1 dholland (dh_next = TAILQ_NEXT(dh, dh_list)) != NULL &&
361 1.1 dholland dh->dh_score >= dh_next->dh_score) {
362 1.1 dholland KASSERT(dh->dh_onlist);
363 1.3 dholland TAILQ_REMOVE(&ulfsdirhash_list, dh, dh_list);
364 1.3 dholland TAILQ_INSERT_AFTER(&ulfsdirhash_list, dh_next, dh,
365 1.1 dholland dh_list);
366 1.1 dholland }
367 1.1 dholland DIRHASHLIST_UNLOCK();
368 1.1 dholland } else {
369 1.1 dholland /* Already the last, though that could change as we wait. */
370 1.1 dholland DIRHASH_LOCK(dh);
371 1.1 dholland }
372 1.1 dholland if (dh->dh_hash == NULL) {
373 1.1 dholland DIRHASH_UNLOCK(dh);
374 1.3 dholland ulfsdirhash_free(ip);
375 1.1 dholland return (EJUSTRETURN);
376 1.1 dholland }
377 1.1 dholland
378 1.1 dholland /* Update the score. */
379 1.1 dholland if (dh->dh_score < DH_SCOREMAX)
380 1.1 dholland dh->dh_score++;
381 1.1 dholland
382 1.1 dholland vp = ip->i_vnode;
383 1.3 dholland bmask = VFSTOULFS(vp->v_mount)->um_mountp->mnt_stat.f_iosize - 1;
384 1.1 dholland blkoff = -1;
385 1.1 dholland bp = NULL;
386 1.1 dholland restart:
387 1.3 dholland slot = ulfsdirhash_hash(dh, name, namelen);
388 1.1 dholland
389 1.1 dholland if (dh->dh_seqopt) {
390 1.1 dholland /*
391 1.1 dholland * Sequential access optimisation. dh_seqoff contains the
392 1.1 dholland * offset of the directory entry immediately following
393 1.1 dholland * the last entry that was looked up. Check if this offset
394 1.1 dholland * appears in the hash chain for the name we are looking for.
395 1.1 dholland */
396 1.1 dholland for (i = slot; (offset = DH_ENTRY(dh, i)) != DIRHASH_EMPTY;
397 1.1 dholland i = WRAPINCR(i, dh->dh_hlen))
398 1.1 dholland if (offset == dh->dh_seqoff)
399 1.1 dholland break;
400 1.1 dholland if (offset == dh->dh_seqoff) {
401 1.1 dholland /*
402 1.1 dholland * We found an entry with the expected offset. This
403 1.1 dholland * is probably the entry we want, but if not, the
404 1.1 dholland * code below will turn off seqoff and retry.
405 1.1 dholland */
406 1.1 dholland slot = i;
407 1.1 dholland } else
408 1.1 dholland dh->dh_seqopt = 0;
409 1.1 dholland }
410 1.1 dholland
411 1.1 dholland for (; (offset = DH_ENTRY(dh, slot)) != DIRHASH_EMPTY;
412 1.1 dholland slot = WRAPINCR(slot, dh->dh_hlen)) {
413 1.1 dholland if (offset == DIRHASH_DEL)
414 1.1 dholland continue;
415 1.1 dholland
416 1.1 dholland if (offset < 0 || offset >= ip->i_size)
417 1.3 dholland panic("ulfsdirhash_lookup: bad offset in hash array");
418 1.1 dholland if ((offset & ~bmask) != blkoff) {
419 1.1 dholland if (bp != NULL)
420 1.1 dholland brelse(bp, 0);
421 1.1 dholland blkoff = offset & ~bmask;
422 1.3 dholland if (ulfs_blkatoff(vp, (off_t)blkoff,
423 1.1 dholland NULL, &bp, false) != 0) {
424 1.1 dholland DIRHASH_UNLOCK(dh);
425 1.1 dholland return (EJUSTRETURN);
426 1.1 dholland }
427 1.1 dholland }
428 1.14 dholland dp = (LFS_DIRHEADER *)((char *)bp->b_data + (offset & bmask));
429 1.10 dholland if (lfs_dir_getreclen(fs, dp) == 0 || lfs_dir_getreclen(fs, dp) >
430 1.1 dholland dirblksiz - (offset & (dirblksiz - 1))) {
431 1.1 dholland /* Corrupted directory. */
432 1.1 dholland DIRHASH_UNLOCK(dh);
433 1.1 dholland brelse(bp, 0);
434 1.1 dholland return (EJUSTRETURN);
435 1.1 dholland }
436 1.9 dholland if (lfs_dir_getnamlen(fs, dp) == namelen &&
437 1.11 dholland memcmp(lfs_dir_nameptr(fs, dp), name, namelen) == 0) {
438 1.1 dholland /* Found. Get the prev offset if needed. */
439 1.1 dholland if (prevoffp != NULL) {
440 1.1 dholland if (offset & (dirblksiz - 1)) {
441 1.10 dholland prevoff = ulfsdirhash_getprev(fs, dp,
442 1.1 dholland offset, dirblksiz);
443 1.1 dholland if (prevoff == -1) {
444 1.1 dholland brelse(bp, 0);
445 1.1 dholland return (EJUSTRETURN);
446 1.1 dholland }
447 1.1 dholland } else
448 1.1 dholland prevoff = offset;
449 1.1 dholland *prevoffp = prevoff;
450 1.1 dholland }
451 1.1 dholland
452 1.1 dholland /* Check for sequential access, and update offset. */
453 1.1 dholland if (dh->dh_seqopt == 0 && dh->dh_seqoff == offset)
454 1.1 dholland dh->dh_seqopt = 1;
455 1.9 dholland dh->dh_seqoff = offset + LFS_DIRSIZ(fs, dp);
456 1.1 dholland DIRHASH_UNLOCK(dh);
457 1.1 dholland
458 1.1 dholland *bpp = bp;
459 1.1 dholland *offp = offset;
460 1.1 dholland return (0);
461 1.1 dholland }
462 1.1 dholland
463 1.1 dholland if (dh->dh_hash == NULL) {
464 1.1 dholland DIRHASH_UNLOCK(dh);
465 1.1 dholland if (bp != NULL)
466 1.1 dholland brelse(bp, 0);
467 1.3 dholland ulfsdirhash_free(ip);
468 1.1 dholland return (EJUSTRETURN);
469 1.1 dholland }
470 1.1 dholland /*
471 1.1 dholland * When the name doesn't match in the seqopt case, go back
472 1.1 dholland * and search normally.
473 1.1 dholland */
474 1.1 dholland if (dh->dh_seqopt) {
475 1.1 dholland dh->dh_seqopt = 0;
476 1.1 dholland goto restart;
477 1.1 dholland }
478 1.1 dholland }
479 1.1 dholland DIRHASH_UNLOCK(dh);
480 1.1 dholland if (bp != NULL)
481 1.1 dholland brelse(bp, 0);
482 1.1 dholland return (ENOENT);
483 1.1 dholland }
484 1.1 dholland
485 1.1 dholland /*
486 1.1 dholland * Find a directory block with room for 'slotneeded' bytes. Returns
487 1.1 dholland * the offset of the directory entry that begins the free space.
488 1.1 dholland * This will either be the offset of an existing entry that has free
489 1.1 dholland * space at the end, or the offset of an entry with d_ino == 0 at
490 1.1 dholland * the start of a DIRBLKSIZ block.
491 1.1 dholland *
492 1.1 dholland * To use the space, the caller may need to compact existing entries in
493 1.1 dholland * the directory. The total number of bytes in all of the entries involved
494 1.1 dholland * in the compaction is stored in *slotsize. In other words, all of
495 1.1 dholland * the entries that must be compacted are exactly contained in the
496 1.1 dholland * region beginning at the returned offset and spanning *slotsize bytes.
497 1.1 dholland *
498 1.1 dholland * Returns -1 if no space was found, indicating that the directory
499 1.1 dholland * must be extended.
500 1.1 dholland */
501 1.1 dholland doff_t
502 1.3 dholland ulfsdirhash_findfree(struct inode *ip, int slotneeded, int *slotsize)
503 1.1 dholland {
504 1.9 dholland struct lfs *fs = ip->i_lfs;
505 1.14 dholland LFS_DIRHEADER *dp;
506 1.1 dholland struct dirhash *dh;
507 1.1 dholland struct buf *bp;
508 1.1 dholland doff_t pos, slotstart;
509 1.1 dholland int dirblock, error, freebytes, i;
510 1.7 dholland int dirblksiz = ip->i_lfs->um_dirblksiz;
511 1.1 dholland
512 1.1 dholland if ((dh = ip->i_dirhash) == NULL)
513 1.1 dholland return (-1);
514 1.1 dholland
515 1.1 dholland DIRHASH_LOCK(dh);
516 1.1 dholland if (dh->dh_hash == NULL) {
517 1.1 dholland DIRHASH_UNLOCK(dh);
518 1.3 dholland ulfsdirhash_free(ip);
519 1.1 dholland return (-1);
520 1.1 dholland }
521 1.1 dholland
522 1.1 dholland /* Find a directory block with the desired free space. */
523 1.1 dholland dirblock = -1;
524 1.1 dholland for (i = howmany(slotneeded, DIRALIGN); i <= DH_NFSTATS; i++)
525 1.1 dholland if ((dirblock = dh->dh_firstfree[i]) != -1)
526 1.1 dholland break;
527 1.1 dholland if (dirblock == -1) {
528 1.1 dholland DIRHASH_UNLOCK(dh);
529 1.1 dholland return (-1);
530 1.1 dholland }
531 1.1 dholland
532 1.1 dholland KASSERT(dirblock < dh->dh_nblk &&
533 1.1 dholland dh->dh_blkfree[dirblock] >= howmany(slotneeded, DIRALIGN));
534 1.1 dholland pos = dirblock * dirblksiz;
535 1.3 dholland error = ulfs_blkatoff(ip->i_vnode, (off_t)pos, (void *)&dp, &bp, false);
536 1.1 dholland if (error) {
537 1.1 dholland DIRHASH_UNLOCK(dh);
538 1.1 dholland return (-1);
539 1.1 dholland }
540 1.1 dholland /* Find the first entry with free space. */
541 1.1 dholland for (i = 0; i < dirblksiz; ) {
542 1.10 dholland if (lfs_dir_getreclen(fs, dp) == 0) {
543 1.1 dholland DIRHASH_UNLOCK(dh);
544 1.1 dholland brelse(bp, 0);
545 1.1 dholland return (-1);
546 1.1 dholland }
547 1.10 dholland if (lfs_dir_getino(fs, dp) == 0 || lfs_dir_getreclen(fs, dp) > LFS_DIRSIZ(fs, dp))
548 1.1 dholland break;
549 1.10 dholland i += lfs_dir_getreclen(fs, dp);
550 1.10 dholland dp = LFS_NEXTDIR(fs, dp);
551 1.1 dholland }
552 1.1 dholland if (i > dirblksiz) {
553 1.1 dholland DIRHASH_UNLOCK(dh);
554 1.1 dholland brelse(bp, 0);
555 1.1 dholland return (-1);
556 1.1 dholland }
557 1.1 dholland slotstart = pos + i;
558 1.1 dholland
559 1.1 dholland /* Find the range of entries needed to get enough space */
560 1.1 dholland freebytes = 0;
561 1.1 dholland while (i < dirblksiz && freebytes < slotneeded) {
562 1.10 dholland freebytes += lfs_dir_getreclen(fs, dp);
563 1.10 dholland if (lfs_dir_getino(fs, dp) != 0)
564 1.9 dholland freebytes -= LFS_DIRSIZ(fs, dp);
565 1.10 dholland if (lfs_dir_getreclen(fs, dp) == 0) {
566 1.1 dholland DIRHASH_UNLOCK(dh);
567 1.1 dholland brelse(bp, 0);
568 1.1 dholland return (-1);
569 1.1 dholland }
570 1.10 dholland i += lfs_dir_getreclen(fs, dp);
571 1.10 dholland dp = LFS_NEXTDIR(fs, dp);
572 1.1 dholland }
573 1.1 dholland if (i > dirblksiz) {
574 1.1 dholland DIRHASH_UNLOCK(dh);
575 1.1 dholland brelse(bp, 0);
576 1.1 dholland return (-1);
577 1.1 dholland }
578 1.1 dholland if (freebytes < slotneeded)
579 1.3 dholland panic("ulfsdirhash_findfree: free mismatch");
580 1.1 dholland DIRHASH_UNLOCK(dh);
581 1.1 dholland brelse(bp, 0);
582 1.1 dholland *slotsize = pos + i - slotstart;
583 1.1 dholland return (slotstart);
584 1.1 dholland }
585 1.1 dholland
586 1.1 dholland /*
587 1.1 dholland * Return the start of the unused space at the end of a directory, or
588 1.1 dholland * -1 if there are no trailing unused blocks.
589 1.1 dholland */
590 1.1 dholland doff_t
591 1.3 dholland ulfsdirhash_enduseful(struct inode *ip)
592 1.1 dholland {
593 1.1 dholland struct dirhash *dh;
594 1.1 dholland int i;
595 1.7 dholland int dirblksiz = ip->i_lfs->um_dirblksiz;
596 1.1 dholland
597 1.1 dholland if ((dh = ip->i_dirhash) == NULL)
598 1.1 dholland return (-1);
599 1.1 dholland
600 1.1 dholland DIRHASH_LOCK(dh);
601 1.1 dholland if (dh->dh_hash == NULL) {
602 1.1 dholland DIRHASH_UNLOCK(dh);
603 1.3 dholland ulfsdirhash_free(ip);
604 1.1 dholland return (-1);
605 1.1 dholland }
606 1.1 dholland
607 1.1 dholland if (dh->dh_blkfree[dh->dh_dirblks - 1] != dirblksiz / DIRALIGN) {
608 1.1 dholland DIRHASH_UNLOCK(dh);
609 1.1 dholland return (-1);
610 1.1 dholland }
611 1.1 dholland
612 1.1 dholland for (i = dh->dh_dirblks - 1; i >= 0; i--)
613 1.1 dholland if (dh->dh_blkfree[i] != dirblksiz / DIRALIGN)
614 1.1 dholland break;
615 1.1 dholland DIRHASH_UNLOCK(dh);
616 1.1 dholland return ((doff_t)(i + 1) * dirblksiz);
617 1.1 dholland }
618 1.1 dholland
619 1.1 dholland /*
620 1.1 dholland * Insert information into the hash about a new directory entry. dirp
621 1.4 dholland * points to a struct lfs_direct containing the entry, and offset specifies
622 1.1 dholland * the offset of this entry.
623 1.1 dholland */
624 1.1 dholland void
625 1.14 dholland ulfsdirhash_add(struct inode *ip, LFS_DIRHEADER *dirp, doff_t offset)
626 1.1 dholland {
627 1.9 dholland struct lfs *fs = ip->i_lfs;
628 1.1 dholland struct dirhash *dh;
629 1.1 dholland int slot;
630 1.7 dholland int dirblksiz = ip->i_lfs->um_dirblksiz;
631 1.1 dholland
632 1.1 dholland if ((dh = ip->i_dirhash) == NULL)
633 1.1 dholland return;
634 1.1 dholland
635 1.1 dholland DIRHASH_LOCK(dh);
636 1.1 dholland if (dh->dh_hash == NULL) {
637 1.1 dholland DIRHASH_UNLOCK(dh);
638 1.3 dholland ulfsdirhash_free(ip);
639 1.1 dholland return;
640 1.1 dholland }
641 1.1 dholland
642 1.1 dholland KASSERT(offset < dh->dh_dirblks * dirblksiz);
643 1.1 dholland /*
644 1.1 dholland * Normal hash usage is < 66%. If the usage gets too high then
645 1.1 dholland * remove the hash entirely and let it be rebuilt later.
646 1.1 dholland */
647 1.1 dholland if (dh->dh_hused >= (dh->dh_hlen * 3) / 4) {
648 1.1 dholland DIRHASH_UNLOCK(dh);
649 1.3 dholland ulfsdirhash_free(ip);
650 1.1 dholland return;
651 1.1 dholland }
652 1.1 dholland
653 1.1 dholland /* Find a free hash slot (empty or deleted), and add the entry. */
654 1.11 dholland slot = ulfsdirhash_hash(dh, lfs_dir_nameptr(fs, dirp),
655 1.11 dholland lfs_dir_getnamlen(fs, dirp));
656 1.1 dholland while (DH_ENTRY(dh, slot) >= 0)
657 1.1 dholland slot = WRAPINCR(slot, dh->dh_hlen);
658 1.1 dholland if (DH_ENTRY(dh, slot) == DIRHASH_EMPTY)
659 1.1 dholland dh->dh_hused++;
660 1.1 dholland DH_ENTRY(dh, slot) = offset;
661 1.1 dholland
662 1.1 dholland /* Update the per-block summary info. */
663 1.9 dholland ulfsdirhash_adjfree(dh, offset, -LFS_DIRSIZ(fs, dirp), dirblksiz);
664 1.1 dholland DIRHASH_UNLOCK(dh);
665 1.1 dholland }
666 1.1 dholland
667 1.1 dholland /*
668 1.1 dholland * Remove the specified directory entry from the hash. The entry to remove
669 1.1 dholland * is defined by the name in `dirp', which must exist at the specified
670 1.1 dholland * `offset' within the directory.
671 1.1 dholland */
672 1.1 dholland void
673 1.14 dholland ulfsdirhash_remove(struct inode *ip, LFS_DIRHEADER *dirp, doff_t offset)
674 1.1 dholland {
675 1.9 dholland struct lfs *fs = ip->i_lfs;
676 1.1 dholland struct dirhash *dh;
677 1.1 dholland int slot;
678 1.7 dholland int dirblksiz = ip->i_lfs->um_dirblksiz;
679 1.1 dholland
680 1.1 dholland if ((dh = ip->i_dirhash) == NULL)
681 1.1 dholland return;
682 1.1 dholland
683 1.1 dholland DIRHASH_LOCK(dh);
684 1.1 dholland if (dh->dh_hash == NULL) {
685 1.1 dholland DIRHASH_UNLOCK(dh);
686 1.3 dholland ulfsdirhash_free(ip);
687 1.1 dholland return;
688 1.1 dholland }
689 1.1 dholland
690 1.1 dholland KASSERT(offset < dh->dh_dirblks * dirblksiz);
691 1.1 dholland /* Find the entry */
692 1.11 dholland slot = ulfsdirhash_findslot(dh, lfs_dir_nameptr(fs, dirp),
693 1.9 dholland lfs_dir_getnamlen(fs, dirp), offset);
694 1.1 dholland
695 1.1 dholland /* Remove the hash entry. */
696 1.3 dholland ulfsdirhash_delslot(dh, slot);
697 1.1 dholland
698 1.1 dholland /* Update the per-block summary info. */
699 1.9 dholland ulfsdirhash_adjfree(dh, offset, LFS_DIRSIZ(fs, dirp), dirblksiz);
700 1.1 dholland DIRHASH_UNLOCK(dh);
701 1.1 dholland }
702 1.1 dholland
703 1.1 dholland /*
704 1.1 dholland * Change the offset associated with a directory entry in the hash. Used
705 1.1 dholland * when compacting directory blocks.
706 1.1 dholland */
707 1.1 dholland void
708 1.14 dholland ulfsdirhash_move(struct inode *ip, LFS_DIRHEADER *dirp, doff_t oldoff,
709 1.1 dholland doff_t newoff)
710 1.1 dholland {
711 1.9 dholland struct lfs *fs = ip->i_lfs;
712 1.1 dholland struct dirhash *dh;
713 1.1 dholland int slot;
714 1.1 dholland
715 1.1 dholland if ((dh = ip->i_dirhash) == NULL)
716 1.1 dholland return;
717 1.1 dholland DIRHASH_LOCK(dh);
718 1.1 dholland if (dh->dh_hash == NULL) {
719 1.1 dholland DIRHASH_UNLOCK(dh);
720 1.3 dholland ulfsdirhash_free(ip);
721 1.1 dholland return;
722 1.1 dholland }
723 1.1 dholland
724 1.7 dholland KASSERT(oldoff < dh->dh_dirblks * ip->i_lfs->um_dirblksiz &&
725 1.7 dholland newoff < dh->dh_dirblks * ip->i_lfs->um_dirblksiz);
726 1.1 dholland /* Find the entry, and update the offset. */
727 1.11 dholland slot = ulfsdirhash_findslot(dh, lfs_dir_nameptr(fs, dirp),
728 1.9 dholland lfs_dir_getnamlen(fs, dirp), oldoff);
729 1.1 dholland DH_ENTRY(dh, slot) = newoff;
730 1.1 dholland DIRHASH_UNLOCK(dh);
731 1.1 dholland }
732 1.1 dholland
733 1.1 dholland /*
734 1.1 dholland * Inform dirhash that the directory has grown by one block that
735 1.1 dholland * begins at offset (i.e. the new length is offset + DIRBLKSIZ).
736 1.1 dholland */
737 1.1 dholland void
738 1.3 dholland ulfsdirhash_newblk(struct inode *ip, doff_t offset)
739 1.1 dholland {
740 1.1 dholland struct dirhash *dh;
741 1.1 dholland int block;
742 1.7 dholland int dirblksiz = ip->i_lfs->um_dirblksiz;
743 1.1 dholland
744 1.1 dholland if ((dh = ip->i_dirhash) == NULL)
745 1.1 dholland return;
746 1.1 dholland DIRHASH_LOCK(dh);
747 1.1 dholland if (dh->dh_hash == NULL) {
748 1.1 dholland DIRHASH_UNLOCK(dh);
749 1.3 dholland ulfsdirhash_free(ip);
750 1.1 dholland return;
751 1.1 dholland }
752 1.1 dholland
753 1.1 dholland KASSERT(offset == dh->dh_dirblks * dirblksiz);
754 1.1 dholland block = offset / dirblksiz;
755 1.1 dholland if (block >= dh->dh_nblk) {
756 1.1 dholland /* Out of space; must rebuild. */
757 1.1 dholland DIRHASH_UNLOCK(dh);
758 1.3 dholland ulfsdirhash_free(ip);
759 1.1 dholland return;
760 1.1 dholland }
761 1.1 dholland dh->dh_dirblks = block + 1;
762 1.1 dholland
763 1.1 dholland /* Account for the new free block. */
764 1.1 dholland dh->dh_blkfree[block] = dirblksiz / DIRALIGN;
765 1.1 dholland if (dh->dh_firstfree[DH_NFSTATS] == -1)
766 1.1 dholland dh->dh_firstfree[DH_NFSTATS] = block;
767 1.1 dholland DIRHASH_UNLOCK(dh);
768 1.1 dholland }
769 1.1 dholland
770 1.1 dholland /*
771 1.1 dholland * Inform dirhash that the directory is being truncated.
772 1.1 dholland */
773 1.1 dholland void
774 1.3 dholland ulfsdirhash_dirtrunc(struct inode *ip, doff_t offset)
775 1.1 dholland {
776 1.1 dholland struct dirhash *dh;
777 1.1 dholland int block, i;
778 1.7 dholland int dirblksiz = ip->i_lfs->um_dirblksiz;
779 1.1 dholland
780 1.1 dholland if ((dh = ip->i_dirhash) == NULL)
781 1.1 dholland return;
782 1.1 dholland
783 1.1 dholland DIRHASH_LOCK(dh);
784 1.1 dholland if (dh->dh_hash == NULL) {
785 1.1 dholland DIRHASH_UNLOCK(dh);
786 1.3 dholland ulfsdirhash_free(ip);
787 1.1 dholland return;
788 1.1 dholland }
789 1.1 dholland
790 1.1 dholland KASSERT(offset <= dh->dh_dirblks * dirblksiz);
791 1.1 dholland block = howmany(offset, dirblksiz);
792 1.1 dholland /*
793 1.1 dholland * If the directory shrinks to less than 1/8 of dh_nblk blocks
794 1.1 dholland * (about 20% of its original size due to the 50% extra added in
795 1.3 dholland * ulfsdirhash_build) then free it, and let the caller rebuild
796 1.1 dholland * if necessary.
797 1.1 dholland */
798 1.1 dholland if (block < dh->dh_nblk / 8 && dh->dh_narrays > 1) {
799 1.1 dholland DIRHASH_UNLOCK(dh);
800 1.3 dholland ulfsdirhash_free(ip);
801 1.1 dholland return;
802 1.1 dholland }
803 1.1 dholland
804 1.1 dholland /*
805 1.1 dholland * Remove any `first free' information pertaining to the
806 1.1 dholland * truncated blocks. All blocks we're removing should be
807 1.1 dholland * completely unused.
808 1.1 dholland */
809 1.1 dholland if (dh->dh_firstfree[DH_NFSTATS] >= block)
810 1.1 dholland dh->dh_firstfree[DH_NFSTATS] = -1;
811 1.1 dholland for (i = block; i < dh->dh_dirblks; i++)
812 1.1 dholland if (dh->dh_blkfree[i] != dirblksiz / DIRALIGN)
813 1.3 dholland panic("ulfsdirhash_dirtrunc: blocks in use");
814 1.1 dholland for (i = 0; i < DH_NFSTATS; i++)
815 1.1 dholland if (dh->dh_firstfree[i] >= block)
816 1.3 dholland panic("ulfsdirhash_dirtrunc: first free corrupt");
817 1.1 dholland dh->dh_dirblks = block;
818 1.1 dholland DIRHASH_UNLOCK(dh);
819 1.1 dholland }
820 1.1 dholland
821 1.1 dholland /*
822 1.1 dholland * Debugging function to check that the dirhash information about
823 1.1 dholland * a directory block matches its actual contents. Panics if a mismatch
824 1.1 dholland * is detected.
825 1.1 dholland *
826 1.1 dholland * On entry, `sbuf' should point to the start of an in-core
827 1.1 dholland * DIRBLKSIZ-sized directory block, and `offset' should contain the
828 1.1 dholland * offset from the start of the directory of that block.
829 1.1 dholland */
830 1.1 dholland void
831 1.3 dholland ulfsdirhash_checkblock(struct inode *ip, char *sbuf, doff_t offset)
832 1.1 dholland {
833 1.9 dholland struct lfs *fs = ip->i_lfs;
834 1.1 dholland struct dirhash *dh;
835 1.14 dholland LFS_DIRHEADER *dp;
836 1.1 dholland int block, ffslot, i, nfree;
837 1.7 dholland int dirblksiz = ip->i_lfs->um_dirblksiz;
838 1.1 dholland
839 1.3 dholland if (!ulfs_dirhashcheck)
840 1.1 dholland return;
841 1.1 dholland if ((dh = ip->i_dirhash) == NULL)
842 1.1 dholland return;
843 1.1 dholland
844 1.1 dholland DIRHASH_LOCK(dh);
845 1.1 dholland if (dh->dh_hash == NULL) {
846 1.1 dholland DIRHASH_UNLOCK(dh);
847 1.3 dholland ulfsdirhash_free(ip);
848 1.1 dholland return;
849 1.1 dholland }
850 1.1 dholland
851 1.1 dholland block = offset / dirblksiz;
852 1.1 dholland if ((offset & (dirblksiz - 1)) != 0 || block >= dh->dh_dirblks)
853 1.3 dholland panic("ulfsdirhash_checkblock: bad offset");
854 1.1 dholland
855 1.1 dholland nfree = 0;
856 1.10 dholland for (i = 0; i < dirblksiz; i += lfs_dir_getreclen(fs, dp)) {
857 1.14 dholland dp = (LFS_DIRHEADER *)(sbuf + i);
858 1.10 dholland if (lfs_dir_getreclen(fs, dp) == 0 || i + lfs_dir_getreclen(fs, dp) > dirblksiz)
859 1.3 dholland panic("ulfsdirhash_checkblock: bad dir");
860 1.1 dholland
861 1.10 dholland if (lfs_dir_getino(fs, dp) == 0) {
862 1.1 dholland #if 0
863 1.1 dholland /*
864 1.1 dholland * XXX entries with d_ino == 0 should only occur
865 1.1 dholland * at the start of a DIRBLKSIZ block. However the
866 1.3 dholland * ulfs code is tolerant of such entries at other
867 1.1 dholland * offsets, and fsck does not fix them.
868 1.1 dholland */
869 1.1 dholland if (i != 0)
870 1.3 dholland panic("ulfsdirhash_checkblock: bad dir inode");
871 1.1 dholland #endif
872 1.10 dholland nfree += lfs_dir_getreclen(fs, dp);
873 1.1 dholland continue;
874 1.1 dholland }
875 1.1 dholland
876 1.1 dholland /* Check that the entry exists (will panic if it doesn't). */
877 1.11 dholland ulfsdirhash_findslot(dh, lfs_dir_nameptr(fs, dp),
878 1.11 dholland lfs_dir_getnamlen(fs, dp),
879 1.9 dholland offset + i);
880 1.1 dholland
881 1.10 dholland nfree += lfs_dir_getreclen(fs, dp) - LFS_DIRSIZ(fs, dp);
882 1.1 dholland }
883 1.1 dholland if (i != dirblksiz)
884 1.3 dholland panic("ulfsdirhash_checkblock: bad dir end");
885 1.1 dholland
886 1.1 dholland if (dh->dh_blkfree[block] * DIRALIGN != nfree)
887 1.3 dholland panic("ulfsdirhash_checkblock: bad free count");
888 1.1 dholland
889 1.1 dholland ffslot = BLKFREE2IDX(nfree / DIRALIGN);
890 1.1 dholland for (i = 0; i <= DH_NFSTATS; i++)
891 1.1 dholland if (dh->dh_firstfree[i] == block && i != ffslot)
892 1.3 dholland panic("ulfsdirhash_checkblock: bad first-free");
893 1.1 dholland if (dh->dh_firstfree[ffslot] == -1)
894 1.3 dholland panic("ulfsdirhash_checkblock: missing first-free entry");
895 1.1 dholland DIRHASH_UNLOCK(dh);
896 1.1 dholland }
897 1.1 dholland
898 1.1 dholland /*
899 1.1 dholland * Hash the specified filename into a dirhash slot.
900 1.1 dholland */
901 1.1 dholland static int
902 1.3 dholland ulfsdirhash_hash(struct dirhash *dh, const char *name, int namelen)
903 1.1 dholland {
904 1.1 dholland u_int32_t hash;
905 1.1 dholland
906 1.1 dholland /*
907 1.1 dholland * We hash the name and then some other bit of data that is
908 1.1 dholland * invariant over the dirhash's lifetime. Otherwise names
909 1.1 dholland * differing only in the last byte are placed close to one
910 1.1 dholland * another in the table, which is bad for linear probing.
911 1.1 dholland */
912 1.1 dholland hash = hash32_buf(name, namelen, HASH32_BUF_INIT);
913 1.1 dholland hash = hash32_buf(&dh, sizeof(dh), hash);
914 1.1 dholland return (hash % dh->dh_hlen);
915 1.1 dholland }
916 1.1 dholland
917 1.1 dholland /*
918 1.1 dholland * Adjust the number of free bytes in the block containing `offset'
919 1.1 dholland * by the value specified by `diff'.
920 1.1 dholland *
921 1.1 dholland * The caller must ensure we have exclusive access to `dh'; normally
922 1.1 dholland * that means that dh_lock should be held, but this is also called
923 1.3 dholland * from ulfsdirhash_build() where exclusive access can be assumed.
924 1.1 dholland */
925 1.1 dholland static void
926 1.3 dholland ulfsdirhash_adjfree(struct dirhash *dh, doff_t offset, int diff, int dirblksiz)
927 1.1 dholland {
928 1.1 dholland int block, i, nfidx, ofidx;
929 1.1 dholland
930 1.1 dholland KASSERT(mutex_owned(&dh->dh_lock));
931 1.1 dholland
932 1.1 dholland /* Update the per-block summary info. */
933 1.1 dholland block = offset / dirblksiz;
934 1.1 dholland KASSERT(block < dh->dh_nblk && block < dh->dh_dirblks);
935 1.1 dholland ofidx = BLKFREE2IDX(dh->dh_blkfree[block]);
936 1.1 dholland dh->dh_blkfree[block] = (int)dh->dh_blkfree[block] + (diff / DIRALIGN);
937 1.1 dholland nfidx = BLKFREE2IDX(dh->dh_blkfree[block]);
938 1.1 dholland
939 1.1 dholland /* Update the `first free' list if necessary. */
940 1.1 dholland if (ofidx != nfidx) {
941 1.1 dholland /* If removing, scan forward for the next block. */
942 1.1 dholland if (dh->dh_firstfree[ofidx] == block) {
943 1.1 dholland for (i = block + 1; i < dh->dh_dirblks; i++)
944 1.1 dholland if (BLKFREE2IDX(dh->dh_blkfree[i]) == ofidx)
945 1.1 dholland break;
946 1.1 dholland dh->dh_firstfree[ofidx] = (i < dh->dh_dirblks) ? i : -1;
947 1.1 dholland }
948 1.1 dholland
949 1.1 dholland /* Make this the new `first free' if necessary */
950 1.1 dholland if (dh->dh_firstfree[nfidx] > block ||
951 1.1 dholland dh->dh_firstfree[nfidx] == -1)
952 1.1 dholland dh->dh_firstfree[nfidx] = block;
953 1.1 dholland }
954 1.1 dholland }
955 1.1 dholland
956 1.1 dholland /*
957 1.1 dholland * Find the specified name which should have the specified offset.
958 1.1 dholland * Returns a slot number, and panics on failure.
959 1.1 dholland *
960 1.1 dholland * `dh' must be locked on entry and remains so on return.
961 1.1 dholland */
962 1.1 dholland static int
963 1.3 dholland ulfsdirhash_findslot(struct dirhash *dh, const char *name, int namelen,
964 1.1 dholland doff_t offset)
965 1.1 dholland {
966 1.1 dholland int slot;
967 1.1 dholland
968 1.1 dholland KASSERT(mutex_owned(&dh->dh_lock));
969 1.1 dholland
970 1.1 dholland /* Find the entry. */
971 1.1 dholland KASSERT(dh->dh_hused < dh->dh_hlen);
972 1.3 dholland slot = ulfsdirhash_hash(dh, name, namelen);
973 1.1 dholland while (DH_ENTRY(dh, slot) != offset &&
974 1.1 dholland DH_ENTRY(dh, slot) != DIRHASH_EMPTY)
975 1.1 dholland slot = WRAPINCR(slot, dh->dh_hlen);
976 1.1 dholland if (DH_ENTRY(dh, slot) != offset)
977 1.3 dholland panic("ulfsdirhash_findslot: '%.*s' not found", namelen, name);
978 1.1 dholland
979 1.1 dholland return (slot);
980 1.1 dholland }
981 1.1 dholland
982 1.1 dholland /*
983 1.1 dholland * Remove the entry corresponding to the specified slot from the hash array.
984 1.1 dholland *
985 1.1 dholland * `dh' must be locked on entry and remains so on return.
986 1.1 dholland */
987 1.1 dholland static void
988 1.3 dholland ulfsdirhash_delslot(struct dirhash *dh, int slot)
989 1.1 dholland {
990 1.1 dholland int i;
991 1.1 dholland
992 1.1 dholland KASSERT(mutex_owned(&dh->dh_lock));
993 1.1 dholland
994 1.1 dholland /* Mark the entry as deleted. */
995 1.1 dholland DH_ENTRY(dh, slot) = DIRHASH_DEL;
996 1.1 dholland
997 1.1 dholland /* If this is the end of a chain of DIRHASH_DEL slots, remove them. */
998 1.1 dholland for (i = slot; DH_ENTRY(dh, i) == DIRHASH_DEL; )
999 1.1 dholland i = WRAPINCR(i, dh->dh_hlen);
1000 1.1 dholland if (DH_ENTRY(dh, i) == DIRHASH_EMPTY) {
1001 1.1 dholland i = WRAPDECR(i, dh->dh_hlen);
1002 1.1 dholland while (DH_ENTRY(dh, i) == DIRHASH_DEL) {
1003 1.1 dholland DH_ENTRY(dh, i) = DIRHASH_EMPTY;
1004 1.1 dholland dh->dh_hused--;
1005 1.1 dholland i = WRAPDECR(i, dh->dh_hlen);
1006 1.1 dholland }
1007 1.1 dholland KASSERT(dh->dh_hused >= 0);
1008 1.1 dholland }
1009 1.1 dholland }
1010 1.1 dholland
1011 1.1 dholland /*
1012 1.1 dholland * Given a directory entry and its offset, find the offset of the
1013 1.1 dholland * previous entry in the same DIRBLKSIZ-sized block. Returns an
1014 1.1 dholland * offset, or -1 if there is no previous entry in the block or some
1015 1.1 dholland * other problem occurred.
1016 1.1 dholland */
1017 1.1 dholland static doff_t
1018 1.14 dholland ulfsdirhash_getprev(struct lfs *fs, LFS_DIRHEADER *dirp,
1019 1.10 dholland doff_t offset, int dirblksiz)
1020 1.1 dholland {
1021 1.14 dholland LFS_DIRHEADER *dp;
1022 1.1 dholland char *blkbuf;
1023 1.1 dholland doff_t blkoff, prevoff;
1024 1.1 dholland int entrypos, i;
1025 1.10 dholland unsigned reclen;
1026 1.1 dholland
1027 1.1 dholland blkoff = offset & ~(dirblksiz - 1); /* offset of start of block */
1028 1.1 dholland entrypos = offset & (dirblksiz - 1); /* entry relative to block */
1029 1.1 dholland blkbuf = (char *)dirp - entrypos;
1030 1.1 dholland prevoff = blkoff;
1031 1.1 dholland
1032 1.1 dholland /* If `offset' is the start of a block, there is no previous entry. */
1033 1.1 dholland if (entrypos == 0)
1034 1.1 dholland return (-1);
1035 1.1 dholland
1036 1.1 dholland /* Scan from the start of the block until we get to the entry. */
1037 1.10 dholland for (i = 0; i < entrypos; i += reclen) {
1038 1.14 dholland dp = (LFS_DIRHEADER *)(blkbuf + i);
1039 1.10 dholland reclen = lfs_dir_getreclen(fs, dp);
1040 1.10 dholland if (reclen == 0 || i + reclen > entrypos)
1041 1.1 dholland return (-1); /* Corrupted directory. */
1042 1.1 dholland prevoff = blkoff + i;
1043 1.1 dholland }
1044 1.1 dholland return (prevoff);
1045 1.1 dholland }
1046 1.1 dholland
1047 1.1 dholland /*
1048 1.1 dholland * Try to free up `wanted' bytes by stealing memory from existing
1049 1.1 dholland * dirhashes. Returns zero with list locked if successful.
1050 1.1 dholland */
1051 1.1 dholland static int
1052 1.3 dholland ulfsdirhash_recycle(int wanted)
1053 1.1 dholland {
1054 1.1 dholland struct dirhash *dh;
1055 1.1 dholland doff_t **hash;
1056 1.1 dholland u_int8_t *blkfree;
1057 1.1 dholland int i, mem, narrays;
1058 1.1 dholland size_t hashsz, blkfreesz;
1059 1.1 dholland
1060 1.1 dholland DIRHASHLIST_LOCK();
1061 1.3 dholland while (wanted + ulfs_dirhashmem > ulfs_dirhashmaxmem) {
1062 1.1 dholland /* Find a dirhash, and lock it. */
1063 1.3 dholland if ((dh = TAILQ_FIRST(&ulfsdirhash_list)) == NULL) {
1064 1.1 dholland DIRHASHLIST_UNLOCK();
1065 1.1 dholland return (-1);
1066 1.1 dholland }
1067 1.1 dholland DIRHASH_LOCK(dh);
1068 1.1 dholland KASSERT(dh->dh_hash != NULL);
1069 1.1 dholland
1070 1.1 dholland /* Decrement the score; only recycle if it becomes zero. */
1071 1.1 dholland if (--dh->dh_score > 0) {
1072 1.1 dholland DIRHASH_UNLOCK(dh);
1073 1.1 dholland DIRHASHLIST_UNLOCK();
1074 1.1 dholland return (-1);
1075 1.1 dholland }
1076 1.1 dholland
1077 1.1 dholland /* Remove it from the list and detach its memory. */
1078 1.3 dholland TAILQ_REMOVE(&ulfsdirhash_list, dh, dh_list);
1079 1.1 dholland dh->dh_onlist = 0;
1080 1.1 dholland hash = dh->dh_hash;
1081 1.1 dholland hashsz = dh->dh_hashsz;
1082 1.1 dholland dh->dh_hash = NULL;
1083 1.1 dholland blkfree = dh->dh_blkfree;
1084 1.1 dholland blkfreesz = dh->dh_blkfreesz;
1085 1.1 dholland dh->dh_blkfree = NULL;
1086 1.1 dholland narrays = dh->dh_narrays;
1087 1.1 dholland mem = narrays * sizeof(*dh->dh_hash) +
1088 1.1 dholland narrays * DH_NBLKOFF * sizeof(**dh->dh_hash) +
1089 1.1 dholland dh->dh_nblk * sizeof(*dh->dh_blkfree);
1090 1.1 dholland
1091 1.1 dholland /* Unlock everything, free the detached memory. */
1092 1.1 dholland DIRHASH_UNLOCK(dh);
1093 1.1 dholland DIRHASHLIST_UNLOCK();
1094 1.1 dholland
1095 1.1 dholland for (i = 0; i < narrays; i++)
1096 1.1 dholland DIRHASH_BLKFREE(hash[i]);
1097 1.1 dholland kmem_free(hash, hashsz);
1098 1.1 dholland kmem_free(blkfree, blkfreesz);
1099 1.1 dholland
1100 1.1 dholland /* Account for the returned memory, and repeat if necessary. */
1101 1.1 dholland DIRHASHLIST_LOCK();
1102 1.3 dholland atomic_add_int(&ulfs_dirhashmem, -mem);
1103 1.1 dholland }
1104 1.1 dholland /* Success. */
1105 1.1 dholland return (0);
1106 1.1 dholland }
1107 1.1 dholland
1108 1.1 dholland static void
1109 1.3 dholland ulfsdirhash_sysctl_init(void)
1110 1.1 dholland {
1111 1.1 dholland const struct sysctlnode *rnode, *cnode;
1112 1.1 dholland
1113 1.3 dholland sysctl_createv(&ulfsdirhash_sysctl_log, 0, NULL, &rnode,
1114 1.1 dholland CTLFLAG_PERMANENT,
1115 1.3 dholland CTLTYPE_NODE, "ulfs",
1116 1.3 dholland SYSCTL_DESCR("ulfs"),
1117 1.1 dholland NULL, 0, NULL, 0,
1118 1.8 pooka CTL_VFS, CTL_CREATE, CTL_EOL);
1119 1.1 dholland
1120 1.3 dholland sysctl_createv(&ulfsdirhash_sysctl_log, 0, &rnode, &rnode,
1121 1.1 dholland CTLFLAG_PERMANENT,
1122 1.1 dholland CTLTYPE_NODE, "dirhash",
1123 1.1 dholland SYSCTL_DESCR("dirhash"),
1124 1.1 dholland NULL, 0, NULL, 0,
1125 1.1 dholland CTL_CREATE, CTL_EOL);
1126 1.1 dholland
1127 1.3 dholland sysctl_createv(&ulfsdirhash_sysctl_log, 0, &rnode, &cnode,
1128 1.1 dholland CTLFLAG_PERMANENT|CTLFLAG_READWRITE,
1129 1.1 dholland CTLTYPE_INT, "minblocks",
1130 1.1 dholland SYSCTL_DESCR("minimum hashed directory size in blocks"),
1131 1.3 dholland NULL, 0, &ulfs_dirhashminblks, 0,
1132 1.1 dholland CTL_CREATE, CTL_EOL);
1133 1.1 dholland
1134 1.3 dholland sysctl_createv(&ulfsdirhash_sysctl_log, 0, &rnode, &cnode,
1135 1.1 dholland CTLFLAG_PERMANENT|CTLFLAG_READWRITE,
1136 1.1 dholland CTLTYPE_INT, "maxmem",
1137 1.1 dholland SYSCTL_DESCR("maximum dirhash memory usage"),
1138 1.3 dholland NULL, 0, &ulfs_dirhashmaxmem, 0,
1139 1.1 dholland CTL_CREATE, CTL_EOL);
1140 1.1 dholland
1141 1.3 dholland sysctl_createv(&ulfsdirhash_sysctl_log, 0, &rnode, &cnode,
1142 1.1 dholland CTLFLAG_PERMANENT|CTLFLAG_READONLY,
1143 1.1 dholland CTLTYPE_INT, "memused",
1144 1.1 dholland SYSCTL_DESCR("current dirhash memory usage"),
1145 1.3 dholland NULL, 0, &ulfs_dirhashmem, 0,
1146 1.1 dholland CTL_CREATE, CTL_EOL);
1147 1.1 dholland
1148 1.3 dholland sysctl_createv(&ulfsdirhash_sysctl_log, 0, &rnode, &cnode,
1149 1.1 dholland CTLFLAG_PERMANENT|CTLFLAG_READWRITE,
1150 1.1 dholland CTLTYPE_INT, "docheck",
1151 1.1 dholland SYSCTL_DESCR("enable extra sanity checks"),
1152 1.3 dholland NULL, 0, &ulfs_dirhashcheck, 0,
1153 1.1 dholland CTL_CREATE, CTL_EOL);
1154 1.1 dholland }
1155 1.1 dholland
1156 1.1 dholland void
1157 1.3 dholland ulfsdirhash_init(void)
1158 1.1 dholland {
1159 1.1 dholland
1160 1.3 dholland mutex_init(&ulfsdirhash_lock, MUTEX_DEFAULT, IPL_NONE);
1161 1.3 dholland ulfsdirhashblk_cache = pool_cache_init(DH_NBLKOFF * sizeof(daddr_t), 0,
1162 1.1 dholland 0, 0, "dirhashblk", NULL, IPL_NONE, NULL, NULL, NULL);
1163 1.3 dholland ulfsdirhash_cache = pool_cache_init(sizeof(struct dirhash), 0,
1164 1.1 dholland 0, 0, "dirhash", NULL, IPL_NONE, NULL, NULL, NULL);
1165 1.3 dholland TAILQ_INIT(&ulfsdirhash_list);
1166 1.3 dholland ulfsdirhash_sysctl_init();
1167 1.1 dholland }
1168 1.1 dholland
1169 1.1 dholland void
1170 1.3 dholland ulfsdirhash_done(void)
1171 1.1 dholland {
1172 1.1 dholland
1173 1.3 dholland KASSERT(TAILQ_EMPTY(&ulfsdirhash_list));
1174 1.3 dholland pool_cache_destroy(ulfsdirhashblk_cache);
1175 1.3 dholland pool_cache_destroy(ulfsdirhash_cache);
1176 1.3 dholland mutex_destroy(&ulfsdirhash_lock);
1177 1.3 dholland sysctl_teardown(&ulfsdirhash_sysctl_log);
1178 1.1 dholland }
1179