ulfs_dirhash.c revision 1.8 1 1.8 pooka /* $NetBSD: ulfs_dirhash.c,v 1.8 2014/02/25 18:30:13 pooka Exp $ */
2 1.1 dholland /* from NetBSD: ufs_dirhash.c,v 1.34 2009/10/05 23:48:08 rmind Exp */
3 1.1 dholland
4 1.1 dholland /*
5 1.1 dholland * Copyright (c) 2001, 2002 Ian Dowse. All rights reserved.
6 1.1 dholland *
7 1.1 dholland * Redistribution and use in source and binary forms, with or without
8 1.1 dholland * modification, are permitted provided that the following conditions
9 1.1 dholland * are met:
10 1.1 dholland * 1. Redistributions of source code must retain the above copyright
11 1.1 dholland * notice, this list of conditions and the following disclaimer.
12 1.1 dholland * 2. Redistributions in binary form must reproduce the above copyright
13 1.1 dholland * notice, this list of conditions and the following disclaimer in the
14 1.1 dholland * documentation and/or other materials provided with the distribution.
15 1.1 dholland *
16 1.1 dholland * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
17 1.1 dholland * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
18 1.1 dholland * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
19 1.1 dholland * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
20 1.1 dholland * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
21 1.1 dholland * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
22 1.1 dholland * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
23 1.1 dholland * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
24 1.1 dholland * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
25 1.1 dholland * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
26 1.1 dholland * SUCH DAMAGE.
27 1.1 dholland *
28 1.1 dholland * $FreeBSD: src/sys/ufs/ufs/ufs_dirhash.c,v 1.3.2.8 2004/12/08 11:54:13 dwmalone Exp $
29 1.1 dholland */
30 1.1 dholland
31 1.1 dholland #include <sys/cdefs.h>
32 1.8 pooka __KERNEL_RCSID(0, "$NetBSD: ulfs_dirhash.c,v 1.8 2014/02/25 18:30:13 pooka Exp $");
33 1.1 dholland
34 1.1 dholland /*
35 1.3 dholland * This implements a hash-based lookup scheme for ULFS directories.
36 1.1 dholland */
37 1.1 dholland
38 1.1 dholland #include <sys/param.h>
39 1.1 dholland #include <sys/systm.h>
40 1.1 dholland #include <sys/kernel.h>
41 1.1 dholland #include <sys/kmem.h>
42 1.1 dholland #include <sys/types.h>
43 1.1 dholland #include <sys/hash.h>
44 1.1 dholland #include <sys/proc.h>
45 1.1 dholland #include <sys/buf.h>
46 1.1 dholland #include <sys/vnode.h>
47 1.1 dholland #include <sys/mount.h>
48 1.1 dholland #include <sys/pool.h>
49 1.1 dholland #include <sys/sysctl.h>
50 1.1 dholland #include <sys/atomic.h>
51 1.1 dholland
52 1.2 dholland #include <ufs/lfs/ulfs_inode.h>
53 1.2 dholland #include <ufs/lfs/ulfs_dirhash.h>
54 1.2 dholland #include <ufs/lfs/ulfsmount.h>
55 1.2 dholland #include <ufs/lfs/ulfs_bswap.h>
56 1.2 dholland #include <ufs/lfs/ulfs_extern.h>
57 1.1 dholland
/*
 * Circular index helpers: step `val' forwards or backwards by one within
 * the range [0, limit).  Both macros may evaluate their arguments more
 * than once, so the arguments must be free of side effects.
 */
#define WRAPINCR(val, limit)	(((val) + 1 != (limit)) ? ((val) + 1) : 0)
#define WRAPDECR(val, limit)	(((val) != 0) ? ((val) - 1) : ((limit) - 1))
/* True when the file system's um_maxsymlinklen is not positive. */
#define OFSFMT(ip)		((ip)->i_lfs->um_maxsymlinklen <= 0)
/* Clamp `n' so that it never exceeds DH_NFSTATS. */
#define BLKFREE2IDX(n)		((n) <= DH_NFSTATS ? (n) : DH_NFSTATS)
62 1.1 dholland
63 1.3 dholland static u_int ulfs_dirhashminblks = 5;
64 1.3 dholland static u_int ulfs_dirhashmaxmem = 2 * 1024 * 1024;
65 1.3 dholland static u_int ulfs_dirhashmem;
66 1.3 dholland static u_int ulfs_dirhashcheck = 0;
67 1.1 dholland
68 1.3 dholland static int ulfsdirhash_hash(struct dirhash *dh, const char *name, int namelen);
69 1.3 dholland static void ulfsdirhash_adjfree(struct dirhash *dh, doff_t offset, int diff,
70 1.1 dholland int dirblksiz);
71 1.3 dholland static void ulfsdirhash_delslot(struct dirhash *dh, int slot);
72 1.3 dholland static int ulfsdirhash_findslot(struct dirhash *dh, const char *name,
73 1.1 dholland int namelen, doff_t offset);
74 1.4 dholland static doff_t ulfsdirhash_getprev(struct lfs_direct *dp, doff_t offset,
75 1.1 dholland int dirblksiz);
76 1.3 dholland static int ulfsdirhash_recycle(int wanted);
77 1.1 dholland
78 1.3 dholland static pool_cache_t ulfsdirhashblk_cache;
79 1.3 dholland static pool_cache_t ulfsdirhash_cache;
80 1.1 dholland
81 1.3 dholland #define DIRHASHLIST_LOCK() mutex_enter(&ulfsdirhash_lock)
82 1.3 dholland #define DIRHASHLIST_UNLOCK() mutex_exit(&ulfsdirhash_lock)
83 1.1 dholland #define DIRHASH_LOCK(dh) mutex_enter(&(dh)->dh_lock)
84 1.1 dholland #define DIRHASH_UNLOCK(dh) mutex_exit(&(dh)->dh_lock)
85 1.1 dholland #define DIRHASH_BLKALLOC() \
86 1.3 dholland pool_cache_get(ulfsdirhashblk_cache, PR_NOWAIT)
87 1.1 dholland #define DIRHASH_BLKFREE(ptr) \
88 1.3 dholland pool_cache_put(ulfsdirhashblk_cache, ptr)
89 1.1 dholland
90 1.1 dholland /* Dirhash list; recently-used entries are near the tail. */
91 1.3 dholland static TAILQ_HEAD(, dirhash) ulfsdirhash_list;
92 1.1 dholland
93 1.3 dholland /* Protects: ulfsdirhash_list, `dh_list' field, ulfs_dirhashmem. */
94 1.3 dholland static kmutex_t ulfsdirhash_lock;
95 1.1 dholland
96 1.3 dholland static struct sysctllog *ulfsdirhash_sysctl_log;
97 1.1 dholland
98 1.1 dholland /*
99 1.1 dholland * Locking order:
100 1.3 dholland * ulfsdirhash_lock
101 1.1 dholland * dh_lock
102 1.1 dholland *
103 1.1 dholland * The dh_lock mutex should be acquired either via the inode lock, or via
104 1.3 dholland * ulfsdirhash_lock. Only the owner of the inode may free the associated
105 1.1 dholland * dirhash, but anything can steal its memory and set dh_hash to NULL.
106 1.1 dholland */
107 1.1 dholland
108 1.1 dholland /*
109 1.1 dholland * Attempt to build up a hash table for the directory contents in
110 1.1 dholland * inode 'ip'. Returns 0 on success, or -1 of the operation failed.
111 1.1 dholland */
112 1.1 dholland int
113 1.3 dholland ulfsdirhash_build(struct inode *ip)
114 1.1 dholland {
115 1.1 dholland struct dirhash *dh;
116 1.1 dholland struct buf *bp = NULL;
117 1.4 dholland struct lfs_direct *ep;
118 1.1 dholland struct vnode *vp;
119 1.1 dholland doff_t bmask, pos;
120 1.1 dholland int dirblocks, i, j, memreqd, nblocks, narrays, nslots, slot;
121 1.7 dholland const int needswap = ULFS_IPNEEDSWAP(ip);
122 1.7 dholland int dirblksiz = ip->i_lfs->um_dirblksiz;
123 1.1 dholland
124 1.1 dholland /* Check if we can/should use dirhash. */
125 1.1 dholland if (ip->i_dirhash == NULL) {
126 1.3 dholland if (ip->i_size < (ulfs_dirhashminblks * dirblksiz) || OFSFMT(ip))
127 1.1 dholland return (-1);
128 1.1 dholland } else {
129 1.1 dholland /* Hash exists, but sysctls could have changed. */
130 1.3 dholland if (ip->i_size < (ulfs_dirhashminblks * dirblksiz) ||
131 1.3 dholland ulfs_dirhashmem > ulfs_dirhashmaxmem) {
132 1.3 dholland ulfsdirhash_free(ip);
133 1.1 dholland return (-1);
134 1.1 dholland }
135 1.1 dholland /* Check if hash exists and is intact (note: unlocked read). */
136 1.1 dholland if (ip->i_dirhash->dh_hash != NULL)
137 1.1 dholland return (0);
138 1.1 dholland /* Free the old, recycled hash and build a new one. */
139 1.3 dholland ulfsdirhash_free(ip);
140 1.1 dholland }
141 1.1 dholland
142 1.1 dholland /* Don't hash removed directories. */
143 1.1 dholland if (ip->i_nlink == 0)
144 1.1 dholland return (-1);
145 1.1 dholland
146 1.1 dholland vp = ip->i_vnode;
147 1.1 dholland /* Allocate 50% more entries than this dir size could ever need. */
148 1.1 dholland KASSERT(ip->i_size >= dirblksiz);
149 1.5 dholland nslots = ip->i_size / LFS_DIRECTSIZ(1);
150 1.1 dholland nslots = (nslots * 3 + 1) / 2;
151 1.1 dholland narrays = howmany(nslots, DH_NBLKOFF);
152 1.1 dholland nslots = narrays * DH_NBLKOFF;
153 1.1 dholland dirblocks = howmany(ip->i_size, dirblksiz);
154 1.1 dholland nblocks = (dirblocks * 3 + 1) / 2;
155 1.1 dholland
156 1.1 dholland memreqd = sizeof(*dh) + narrays * sizeof(*dh->dh_hash) +
157 1.1 dholland narrays * DH_NBLKOFF * sizeof(**dh->dh_hash) +
158 1.1 dholland nblocks * sizeof(*dh->dh_blkfree);
159 1.1 dholland
160 1.3 dholland while (atomic_add_int_nv(&ulfs_dirhashmem, memreqd) >
161 1.3 dholland ulfs_dirhashmaxmem) {
162 1.3 dholland atomic_add_int(&ulfs_dirhashmem, -memreqd);
163 1.3 dholland if (memreqd > ulfs_dirhashmaxmem / 2)
164 1.1 dholland return (-1);
165 1.1 dholland /* Try to free some space. */
166 1.3 dholland if (ulfsdirhash_recycle(memreqd) != 0)
167 1.1 dholland return (-1);
168 1.1 dholland else
169 1.1 dholland DIRHASHLIST_UNLOCK();
170 1.1 dholland }
171 1.1 dholland
172 1.1 dholland /*
173 1.1 dholland * Use non-blocking mallocs so that we will revert to a linear
174 1.1 dholland * lookup on failure rather than potentially blocking forever.
175 1.1 dholland */
176 1.3 dholland dh = pool_cache_get(ulfsdirhash_cache, PR_NOWAIT);
177 1.1 dholland if (dh == NULL) {
178 1.3 dholland atomic_add_int(&ulfs_dirhashmem, -memreqd);
179 1.1 dholland return (-1);
180 1.1 dholland }
181 1.1 dholland memset(dh, 0, sizeof(*dh));
182 1.1 dholland mutex_init(&dh->dh_lock, MUTEX_DEFAULT, IPL_NONE);
183 1.1 dholland DIRHASH_LOCK(dh);
184 1.1 dholland dh->dh_hashsz = narrays * sizeof(dh->dh_hash[0]);
185 1.1 dholland dh->dh_hash = kmem_zalloc(dh->dh_hashsz, KM_NOSLEEP);
186 1.1 dholland dh->dh_blkfreesz = nblocks * sizeof(dh->dh_blkfree[0]);
187 1.1 dholland dh->dh_blkfree = kmem_zalloc(dh->dh_blkfreesz, KM_NOSLEEP);
188 1.1 dholland if (dh->dh_hash == NULL || dh->dh_blkfree == NULL)
189 1.1 dholland goto fail;
190 1.1 dholland for (i = 0; i < narrays; i++) {
191 1.1 dholland if ((dh->dh_hash[i] = DIRHASH_BLKALLOC()) == NULL)
192 1.1 dholland goto fail;
193 1.1 dholland for (j = 0; j < DH_NBLKOFF; j++)
194 1.1 dholland dh->dh_hash[i][j] = DIRHASH_EMPTY;
195 1.1 dholland }
196 1.1 dholland
197 1.1 dholland /* Initialise the hash table and block statistics. */
198 1.1 dholland dh->dh_narrays = narrays;
199 1.1 dholland dh->dh_hlen = nslots;
200 1.1 dholland dh->dh_nblk = nblocks;
201 1.1 dholland dh->dh_dirblks = dirblocks;
202 1.1 dholland for (i = 0; i < dirblocks; i++)
203 1.1 dholland dh->dh_blkfree[i] = dirblksiz / DIRALIGN;
204 1.1 dholland for (i = 0; i < DH_NFSTATS; i++)
205 1.1 dholland dh->dh_firstfree[i] = -1;
206 1.1 dholland dh->dh_firstfree[DH_NFSTATS] = 0;
207 1.1 dholland dh->dh_seqopt = 0;
208 1.1 dholland dh->dh_seqoff = 0;
209 1.1 dholland dh->dh_score = DH_SCOREINIT;
210 1.1 dholland ip->i_dirhash = dh;
211 1.1 dholland
212 1.3 dholland bmask = VFSTOULFS(vp->v_mount)->um_mountp->mnt_stat.f_iosize - 1;
213 1.1 dholland pos = 0;
214 1.1 dholland while (pos < ip->i_size) {
215 1.1 dholland if ((curcpu()->ci_schedstate.spc_flags & SPCF_SHOULDYIELD)
216 1.1 dholland != 0) {
217 1.1 dholland preempt();
218 1.1 dholland }
219 1.1 dholland /* If necessary, get the next directory block. */
220 1.1 dholland if ((pos & bmask) == 0) {
221 1.1 dholland if (bp != NULL)
222 1.1 dholland brelse(bp, 0);
223 1.3 dholland if (ulfs_blkatoff(vp, (off_t)pos, NULL, &bp, false) != 0)
224 1.1 dholland goto fail;
225 1.1 dholland }
226 1.1 dholland
227 1.1 dholland /* Add this entry to the hash. */
228 1.4 dholland ep = (struct lfs_direct *)((char *)bp->b_data + (pos & bmask));
229 1.1 dholland if (ep->d_reclen == 0 || ep->d_reclen >
230 1.1 dholland dirblksiz - (pos & (dirblksiz - 1))) {
231 1.1 dholland /* Corrupted directory. */
232 1.1 dholland brelse(bp, 0);
233 1.1 dholland goto fail;
234 1.1 dholland }
235 1.1 dholland if (ep->d_ino != 0) {
236 1.3 dholland /* Add the entry (simplified ulfsdirhash_add). */
237 1.3 dholland slot = ulfsdirhash_hash(dh, ep->d_name, ep->d_namlen);
238 1.1 dholland while (DH_ENTRY(dh, slot) != DIRHASH_EMPTY)
239 1.1 dholland slot = WRAPINCR(slot, dh->dh_hlen);
240 1.1 dholland dh->dh_hused++;
241 1.1 dholland DH_ENTRY(dh, slot) = pos;
242 1.5 dholland ulfsdirhash_adjfree(dh, pos, -LFS_DIRSIZ(0, ep, needswap),
243 1.1 dholland dirblksiz);
244 1.1 dholland }
245 1.1 dholland pos += ep->d_reclen;
246 1.1 dholland }
247 1.1 dholland
248 1.1 dholland if (bp != NULL)
249 1.1 dholland brelse(bp, 0);
250 1.1 dholland DIRHASHLIST_LOCK();
251 1.3 dholland TAILQ_INSERT_TAIL(&ulfsdirhash_list, dh, dh_list);
252 1.1 dholland dh->dh_onlist = 1;
253 1.1 dholland DIRHASH_UNLOCK(dh);
254 1.1 dholland DIRHASHLIST_UNLOCK();
255 1.1 dholland return (0);
256 1.1 dholland
257 1.1 dholland fail:
258 1.1 dholland DIRHASH_UNLOCK(dh);
259 1.1 dholland if (dh->dh_hash != NULL) {
260 1.1 dholland for (i = 0; i < narrays; i++)
261 1.1 dholland if (dh->dh_hash[i] != NULL)
262 1.1 dholland DIRHASH_BLKFREE(dh->dh_hash[i]);
263 1.1 dholland kmem_free(dh->dh_hash, dh->dh_hashsz);
264 1.1 dholland }
265 1.1 dholland if (dh->dh_blkfree != NULL)
266 1.1 dholland kmem_free(dh->dh_blkfree, dh->dh_blkfreesz);
267 1.1 dholland mutex_destroy(&dh->dh_lock);
268 1.3 dholland pool_cache_put(ulfsdirhash_cache, dh);
269 1.1 dholland ip->i_dirhash = NULL;
270 1.3 dholland atomic_add_int(&ulfs_dirhashmem, -memreqd);
271 1.1 dholland return (-1);
272 1.1 dholland }
273 1.1 dholland
274 1.1 dholland /*
275 1.1 dholland * Free any hash table associated with inode 'ip'.
276 1.1 dholland */
277 1.1 dholland void
278 1.3 dholland ulfsdirhash_free(struct inode *ip)
279 1.1 dholland {
280 1.1 dholland struct dirhash *dh;
281 1.1 dholland int i, mem;
282 1.1 dholland
283 1.1 dholland if ((dh = ip->i_dirhash) == NULL)
284 1.1 dholland return;
285 1.1 dholland
286 1.1 dholland if (dh->dh_onlist) {
287 1.1 dholland DIRHASHLIST_LOCK();
288 1.1 dholland if (dh->dh_onlist)
289 1.3 dholland TAILQ_REMOVE(&ulfsdirhash_list, dh, dh_list);
290 1.1 dholland DIRHASHLIST_UNLOCK();
291 1.1 dholland }
292 1.1 dholland
293 1.1 dholland /* The dirhash pointed to by 'dh' is exclusively ours now. */
294 1.1 dholland mem = sizeof(*dh);
295 1.1 dholland if (dh->dh_hash != NULL) {
296 1.1 dholland for (i = 0; i < dh->dh_narrays; i++)
297 1.1 dholland DIRHASH_BLKFREE(dh->dh_hash[i]);
298 1.1 dholland kmem_free(dh->dh_hash, dh->dh_hashsz);
299 1.1 dholland kmem_free(dh->dh_blkfree, dh->dh_blkfreesz);
300 1.1 dholland mem += dh->dh_hashsz;
301 1.1 dholland mem += dh->dh_narrays * DH_NBLKOFF * sizeof(**dh->dh_hash);
302 1.1 dholland mem += dh->dh_nblk * sizeof(*dh->dh_blkfree);
303 1.1 dholland }
304 1.1 dholland mutex_destroy(&dh->dh_lock);
305 1.3 dholland pool_cache_put(ulfsdirhash_cache, dh);
306 1.1 dholland ip->i_dirhash = NULL;
307 1.1 dholland
308 1.3 dholland atomic_add_int(&ulfs_dirhashmem, -mem);
309 1.1 dholland }
310 1.1 dholland
311 1.1 dholland /*
312 1.1 dholland * Find the offset of the specified name within the given inode.
313 1.1 dholland * Returns 0 on success, ENOENT if the entry does not exist, or
314 1.1 dholland * EJUSTRETURN if the caller should revert to a linear search.
315 1.1 dholland *
316 1.1 dholland * If successful, the directory offset is stored in *offp, and a
317 1.1 dholland * pointer to a struct buf containing the entry is stored in *bpp. If
318 1.1 dholland * prevoffp is non-NULL, the offset of the previous entry within
319 1.1 dholland * the DIRBLKSIZ-sized block is stored in *prevoffp (if the entry
320 1.1 dholland * is the first in a block, the start of the block is used).
321 1.1 dholland */
322 1.1 dholland int
323 1.3 dholland ulfsdirhash_lookup(struct inode *ip, const char *name, int namelen, doff_t *offp,
324 1.1 dholland struct buf **bpp, doff_t *prevoffp)
325 1.1 dholland {
326 1.1 dholland struct dirhash *dh, *dh_next;
327 1.4 dholland struct lfs_direct *dp;
328 1.1 dholland struct vnode *vp;
329 1.1 dholland struct buf *bp;
330 1.1 dholland doff_t blkoff, bmask, offset, prevoff;
331 1.1 dholland int i, slot;
332 1.7 dholland const int needswap = ULFS_IPNEEDSWAP(ip);
333 1.7 dholland int dirblksiz = ip->i_lfs->um_dirblksiz;
334 1.1 dholland
335 1.1 dholland if ((dh = ip->i_dirhash) == NULL)
336 1.1 dholland return (EJUSTRETURN);
337 1.1 dholland
338 1.1 dholland /*
339 1.1 dholland * Move this dirhash towards the end of the list if it has a
340 1.1 dholland * score higher than the next entry, and acquire the dh_lock.
341 1.1 dholland * Optimise the case where it's already the last by performing
342 1.1 dholland * an unlocked read of the TAILQ_NEXT pointer.
343 1.1 dholland *
344 1.1 dholland * In both cases, end up holding just dh_lock.
345 1.1 dholland */
346 1.1 dholland if (TAILQ_NEXT(dh, dh_list) != NULL) {
347 1.1 dholland DIRHASHLIST_LOCK();
348 1.1 dholland DIRHASH_LOCK(dh);
349 1.1 dholland /*
350 1.1 dholland * If the new score will be greater than that of the next
351 1.1 dholland * entry, then move this entry past it. With both mutexes
352 1.1 dholland * held, dh_next won't go away, but its dh_score could
353 1.1 dholland * change; that's not important since it is just a hint.
354 1.1 dholland */
355 1.1 dholland if (dh->dh_hash != NULL &&
356 1.1 dholland (dh_next = TAILQ_NEXT(dh, dh_list)) != NULL &&
357 1.1 dholland dh->dh_score >= dh_next->dh_score) {
358 1.1 dholland KASSERT(dh->dh_onlist);
359 1.3 dholland TAILQ_REMOVE(&ulfsdirhash_list, dh, dh_list);
360 1.3 dholland TAILQ_INSERT_AFTER(&ulfsdirhash_list, dh_next, dh,
361 1.1 dholland dh_list);
362 1.1 dholland }
363 1.1 dholland DIRHASHLIST_UNLOCK();
364 1.1 dholland } else {
365 1.1 dholland /* Already the last, though that could change as we wait. */
366 1.1 dholland DIRHASH_LOCK(dh);
367 1.1 dholland }
368 1.1 dholland if (dh->dh_hash == NULL) {
369 1.1 dholland DIRHASH_UNLOCK(dh);
370 1.3 dholland ulfsdirhash_free(ip);
371 1.1 dholland return (EJUSTRETURN);
372 1.1 dholland }
373 1.1 dholland
374 1.1 dholland /* Update the score. */
375 1.1 dholland if (dh->dh_score < DH_SCOREMAX)
376 1.1 dholland dh->dh_score++;
377 1.1 dholland
378 1.1 dholland vp = ip->i_vnode;
379 1.3 dholland bmask = VFSTOULFS(vp->v_mount)->um_mountp->mnt_stat.f_iosize - 1;
380 1.1 dholland blkoff = -1;
381 1.1 dholland bp = NULL;
382 1.1 dholland restart:
383 1.3 dholland slot = ulfsdirhash_hash(dh, name, namelen);
384 1.1 dholland
385 1.1 dholland if (dh->dh_seqopt) {
386 1.1 dholland /*
387 1.1 dholland * Sequential access optimisation. dh_seqoff contains the
388 1.1 dholland * offset of the directory entry immediately following
389 1.1 dholland * the last entry that was looked up. Check if this offset
390 1.1 dholland * appears in the hash chain for the name we are looking for.
391 1.1 dholland */
392 1.1 dholland for (i = slot; (offset = DH_ENTRY(dh, i)) != DIRHASH_EMPTY;
393 1.1 dholland i = WRAPINCR(i, dh->dh_hlen))
394 1.1 dholland if (offset == dh->dh_seqoff)
395 1.1 dholland break;
396 1.1 dholland if (offset == dh->dh_seqoff) {
397 1.1 dholland /*
398 1.1 dholland * We found an entry with the expected offset. This
399 1.1 dholland * is probably the entry we want, but if not, the
400 1.1 dholland * code below will turn off seqoff and retry.
401 1.1 dholland */
402 1.1 dholland slot = i;
403 1.1 dholland } else
404 1.1 dholland dh->dh_seqopt = 0;
405 1.1 dholland }
406 1.1 dholland
407 1.1 dholland for (; (offset = DH_ENTRY(dh, slot)) != DIRHASH_EMPTY;
408 1.1 dholland slot = WRAPINCR(slot, dh->dh_hlen)) {
409 1.1 dholland if (offset == DIRHASH_DEL)
410 1.1 dholland continue;
411 1.1 dholland
412 1.1 dholland if (offset < 0 || offset >= ip->i_size)
413 1.3 dholland panic("ulfsdirhash_lookup: bad offset in hash array");
414 1.1 dholland if ((offset & ~bmask) != blkoff) {
415 1.1 dholland if (bp != NULL)
416 1.1 dholland brelse(bp, 0);
417 1.1 dholland blkoff = offset & ~bmask;
418 1.3 dholland if (ulfs_blkatoff(vp, (off_t)blkoff,
419 1.1 dholland NULL, &bp, false) != 0) {
420 1.1 dholland DIRHASH_UNLOCK(dh);
421 1.1 dholland return (EJUSTRETURN);
422 1.1 dholland }
423 1.1 dholland }
424 1.4 dholland dp = (struct lfs_direct *)((char *)bp->b_data + (offset & bmask));
425 1.1 dholland if (dp->d_reclen == 0 || dp->d_reclen >
426 1.1 dholland dirblksiz - (offset & (dirblksiz - 1))) {
427 1.1 dholland /* Corrupted directory. */
428 1.1 dholland DIRHASH_UNLOCK(dh);
429 1.1 dholland brelse(bp, 0);
430 1.1 dholland return (EJUSTRETURN);
431 1.1 dholland }
432 1.1 dholland if (dp->d_namlen == namelen &&
433 1.1 dholland memcmp(dp->d_name, name, namelen) == 0) {
434 1.1 dholland /* Found. Get the prev offset if needed. */
435 1.1 dholland if (prevoffp != NULL) {
436 1.1 dholland if (offset & (dirblksiz - 1)) {
437 1.3 dholland prevoff = ulfsdirhash_getprev(dp,
438 1.1 dholland offset, dirblksiz);
439 1.1 dholland if (prevoff == -1) {
440 1.1 dholland brelse(bp, 0);
441 1.1 dholland return (EJUSTRETURN);
442 1.1 dholland }
443 1.1 dholland } else
444 1.1 dholland prevoff = offset;
445 1.1 dholland *prevoffp = prevoff;
446 1.1 dholland }
447 1.1 dholland
448 1.1 dholland /* Check for sequential access, and update offset. */
449 1.1 dholland if (dh->dh_seqopt == 0 && dh->dh_seqoff == offset)
450 1.1 dholland dh->dh_seqopt = 1;
451 1.5 dholland dh->dh_seqoff = offset + LFS_DIRSIZ(0, dp, needswap);
452 1.1 dholland DIRHASH_UNLOCK(dh);
453 1.1 dholland
454 1.1 dholland *bpp = bp;
455 1.1 dholland *offp = offset;
456 1.1 dholland return (0);
457 1.1 dholland }
458 1.1 dholland
459 1.1 dholland if (dh->dh_hash == NULL) {
460 1.1 dholland DIRHASH_UNLOCK(dh);
461 1.1 dholland if (bp != NULL)
462 1.1 dholland brelse(bp, 0);
463 1.3 dholland ulfsdirhash_free(ip);
464 1.1 dholland return (EJUSTRETURN);
465 1.1 dholland }
466 1.1 dholland /*
467 1.1 dholland * When the name doesn't match in the seqopt case, go back
468 1.1 dholland * and search normally.
469 1.1 dholland */
470 1.1 dholland if (dh->dh_seqopt) {
471 1.1 dholland dh->dh_seqopt = 0;
472 1.1 dholland goto restart;
473 1.1 dholland }
474 1.1 dholland }
475 1.1 dholland DIRHASH_UNLOCK(dh);
476 1.1 dholland if (bp != NULL)
477 1.1 dholland brelse(bp, 0);
478 1.1 dholland return (ENOENT);
479 1.1 dholland }
480 1.1 dholland
481 1.1 dholland /*
482 1.1 dholland * Find a directory block with room for 'slotneeded' bytes. Returns
483 1.1 dholland * the offset of the directory entry that begins the free space.
484 1.1 dholland * This will either be the offset of an existing entry that has free
485 1.1 dholland * space at the end, or the offset of an entry with d_ino == 0 at
486 1.1 dholland * the start of a DIRBLKSIZ block.
487 1.1 dholland *
488 1.1 dholland * To use the space, the caller may need to compact existing entries in
489 1.1 dholland * the directory. The total number of bytes in all of the entries involved
490 1.1 dholland * in the compaction is stored in *slotsize. In other words, all of
491 1.1 dholland * the entries that must be compacted are exactly contained in the
492 1.1 dholland * region beginning at the returned offset and spanning *slotsize bytes.
493 1.1 dholland *
494 1.1 dholland * Returns -1 if no space was found, indicating that the directory
495 1.1 dholland * must be extended.
496 1.1 dholland */
497 1.1 dholland doff_t
498 1.3 dholland ulfsdirhash_findfree(struct inode *ip, int slotneeded, int *slotsize)
499 1.1 dholland {
500 1.4 dholland struct lfs_direct *dp;
501 1.1 dholland struct dirhash *dh;
502 1.1 dholland struct buf *bp;
503 1.1 dholland doff_t pos, slotstart;
504 1.1 dholland int dirblock, error, freebytes, i;
505 1.7 dholland const int needswap = ULFS_IPNEEDSWAP(ip);
506 1.7 dholland int dirblksiz = ip->i_lfs->um_dirblksiz;
507 1.1 dholland
508 1.1 dholland if ((dh = ip->i_dirhash) == NULL)
509 1.1 dholland return (-1);
510 1.1 dholland
511 1.1 dholland DIRHASH_LOCK(dh);
512 1.1 dholland if (dh->dh_hash == NULL) {
513 1.1 dholland DIRHASH_UNLOCK(dh);
514 1.3 dholland ulfsdirhash_free(ip);
515 1.1 dholland return (-1);
516 1.1 dholland }
517 1.1 dholland
518 1.1 dholland /* Find a directory block with the desired free space. */
519 1.1 dholland dirblock = -1;
520 1.1 dholland for (i = howmany(slotneeded, DIRALIGN); i <= DH_NFSTATS; i++)
521 1.1 dholland if ((dirblock = dh->dh_firstfree[i]) != -1)
522 1.1 dholland break;
523 1.1 dholland if (dirblock == -1) {
524 1.1 dholland DIRHASH_UNLOCK(dh);
525 1.1 dholland return (-1);
526 1.1 dholland }
527 1.1 dholland
528 1.1 dholland KASSERT(dirblock < dh->dh_nblk &&
529 1.1 dholland dh->dh_blkfree[dirblock] >= howmany(slotneeded, DIRALIGN));
530 1.1 dholland pos = dirblock * dirblksiz;
531 1.3 dholland error = ulfs_blkatoff(ip->i_vnode, (off_t)pos, (void *)&dp, &bp, false);
532 1.1 dholland if (error) {
533 1.1 dholland DIRHASH_UNLOCK(dh);
534 1.1 dholland return (-1);
535 1.1 dholland }
536 1.1 dholland /* Find the first entry with free space. */
537 1.1 dholland for (i = 0; i < dirblksiz; ) {
538 1.1 dholland if (dp->d_reclen == 0) {
539 1.1 dholland DIRHASH_UNLOCK(dh);
540 1.1 dholland brelse(bp, 0);
541 1.1 dholland return (-1);
542 1.1 dholland }
543 1.5 dholland if (dp->d_ino == 0 || dp->d_reclen > LFS_DIRSIZ(0, dp, needswap))
544 1.1 dholland break;
545 1.1 dholland i += dp->d_reclen;
546 1.4 dholland dp = (struct lfs_direct *)((char *)dp + dp->d_reclen);
547 1.1 dholland }
548 1.1 dholland if (i > dirblksiz) {
549 1.1 dholland DIRHASH_UNLOCK(dh);
550 1.1 dholland brelse(bp, 0);
551 1.1 dholland return (-1);
552 1.1 dholland }
553 1.1 dholland slotstart = pos + i;
554 1.1 dholland
555 1.1 dholland /* Find the range of entries needed to get enough space */
556 1.1 dholland freebytes = 0;
557 1.1 dholland while (i < dirblksiz && freebytes < slotneeded) {
558 1.1 dholland freebytes += dp->d_reclen;
559 1.1 dholland if (dp->d_ino != 0)
560 1.5 dholland freebytes -= LFS_DIRSIZ(0, dp, needswap);
561 1.1 dholland if (dp->d_reclen == 0) {
562 1.1 dholland DIRHASH_UNLOCK(dh);
563 1.1 dholland brelse(bp, 0);
564 1.1 dholland return (-1);
565 1.1 dholland }
566 1.1 dholland i += dp->d_reclen;
567 1.4 dholland dp = (struct lfs_direct *)((char *)dp + dp->d_reclen);
568 1.1 dholland }
569 1.1 dholland if (i > dirblksiz) {
570 1.1 dholland DIRHASH_UNLOCK(dh);
571 1.1 dholland brelse(bp, 0);
572 1.1 dholland return (-1);
573 1.1 dholland }
574 1.1 dholland if (freebytes < slotneeded)
575 1.3 dholland panic("ulfsdirhash_findfree: free mismatch");
576 1.1 dholland DIRHASH_UNLOCK(dh);
577 1.1 dholland brelse(bp, 0);
578 1.1 dholland *slotsize = pos + i - slotstart;
579 1.1 dholland return (slotstart);
580 1.1 dholland }
581 1.1 dholland
582 1.1 dholland /*
583 1.1 dholland * Return the start of the unused space at the end of a directory, or
584 1.1 dholland * -1 if there are no trailing unused blocks.
585 1.1 dholland */
586 1.1 dholland doff_t
587 1.3 dholland ulfsdirhash_enduseful(struct inode *ip)
588 1.1 dholland {
589 1.1 dholland struct dirhash *dh;
590 1.1 dholland int i;
591 1.7 dholland int dirblksiz = ip->i_lfs->um_dirblksiz;
592 1.1 dholland
593 1.1 dholland if ((dh = ip->i_dirhash) == NULL)
594 1.1 dholland return (-1);
595 1.1 dholland
596 1.1 dholland DIRHASH_LOCK(dh);
597 1.1 dholland if (dh->dh_hash == NULL) {
598 1.1 dholland DIRHASH_UNLOCK(dh);
599 1.3 dholland ulfsdirhash_free(ip);
600 1.1 dholland return (-1);
601 1.1 dholland }
602 1.1 dholland
603 1.1 dholland if (dh->dh_blkfree[dh->dh_dirblks - 1] != dirblksiz / DIRALIGN) {
604 1.1 dholland DIRHASH_UNLOCK(dh);
605 1.1 dholland return (-1);
606 1.1 dholland }
607 1.1 dholland
608 1.1 dholland for (i = dh->dh_dirblks - 1; i >= 0; i--)
609 1.1 dholland if (dh->dh_blkfree[i] != dirblksiz / DIRALIGN)
610 1.1 dholland break;
611 1.1 dholland DIRHASH_UNLOCK(dh);
612 1.1 dholland return ((doff_t)(i + 1) * dirblksiz);
613 1.1 dholland }
614 1.1 dholland
615 1.1 dholland /*
616 1.1 dholland * Insert information into the hash about a new directory entry. dirp
617 1.4 dholland * points to a struct lfs_direct containing the entry, and offset specifies
618 1.1 dholland * the offset of this entry.
619 1.1 dholland */
620 1.1 dholland void
621 1.4 dholland ulfsdirhash_add(struct inode *ip, struct lfs_direct *dirp, doff_t offset)
622 1.1 dholland {
623 1.1 dholland struct dirhash *dh;
624 1.1 dholland int slot;
625 1.7 dholland const int needswap = ULFS_IPNEEDSWAP(ip);
626 1.7 dholland int dirblksiz = ip->i_lfs->um_dirblksiz;
627 1.1 dholland
628 1.1 dholland if ((dh = ip->i_dirhash) == NULL)
629 1.1 dholland return;
630 1.1 dholland
631 1.1 dholland DIRHASH_LOCK(dh);
632 1.1 dholland if (dh->dh_hash == NULL) {
633 1.1 dholland DIRHASH_UNLOCK(dh);
634 1.3 dholland ulfsdirhash_free(ip);
635 1.1 dholland return;
636 1.1 dholland }
637 1.1 dholland
638 1.1 dholland KASSERT(offset < dh->dh_dirblks * dirblksiz);
639 1.1 dholland /*
640 1.1 dholland * Normal hash usage is < 66%. If the usage gets too high then
641 1.1 dholland * remove the hash entirely and let it be rebuilt later.
642 1.1 dholland */
643 1.1 dholland if (dh->dh_hused >= (dh->dh_hlen * 3) / 4) {
644 1.1 dholland DIRHASH_UNLOCK(dh);
645 1.3 dholland ulfsdirhash_free(ip);
646 1.1 dholland return;
647 1.1 dholland }
648 1.1 dholland
649 1.1 dholland /* Find a free hash slot (empty or deleted), and add the entry. */
650 1.3 dholland slot = ulfsdirhash_hash(dh, dirp->d_name, dirp->d_namlen);
651 1.1 dholland while (DH_ENTRY(dh, slot) >= 0)
652 1.1 dholland slot = WRAPINCR(slot, dh->dh_hlen);
653 1.1 dholland if (DH_ENTRY(dh, slot) == DIRHASH_EMPTY)
654 1.1 dholland dh->dh_hused++;
655 1.1 dholland DH_ENTRY(dh, slot) = offset;
656 1.1 dholland
657 1.1 dholland /* Update the per-block summary info. */
658 1.5 dholland ulfsdirhash_adjfree(dh, offset, -LFS_DIRSIZ(0, dirp, needswap), dirblksiz);
659 1.1 dholland DIRHASH_UNLOCK(dh);
660 1.1 dholland }
661 1.1 dholland
662 1.1 dholland /*
663 1.1 dholland * Remove the specified directory entry from the hash. The entry to remove
664 1.1 dholland * is defined by the name in `dirp', which must exist at the specified
665 1.1 dholland * `offset' within the directory.
666 1.1 dholland */
667 1.1 dholland void
668 1.4 dholland ulfsdirhash_remove(struct inode *ip, struct lfs_direct *dirp, doff_t offset)
669 1.1 dholland {
670 1.1 dholland struct dirhash *dh;
671 1.1 dholland int slot;
672 1.7 dholland const int needswap = ULFS_IPNEEDSWAP(ip);
673 1.7 dholland int dirblksiz = ip->i_lfs->um_dirblksiz;
674 1.1 dholland
675 1.1 dholland if ((dh = ip->i_dirhash) == NULL)
676 1.1 dholland return;
677 1.1 dholland
678 1.1 dholland DIRHASH_LOCK(dh);
679 1.1 dholland if (dh->dh_hash == NULL) {
680 1.1 dholland DIRHASH_UNLOCK(dh);
681 1.3 dholland ulfsdirhash_free(ip);
682 1.1 dholland return;
683 1.1 dholland }
684 1.1 dholland
685 1.1 dholland KASSERT(offset < dh->dh_dirblks * dirblksiz);
686 1.1 dholland /* Find the entry */
687 1.3 dholland slot = ulfsdirhash_findslot(dh, dirp->d_name, dirp->d_namlen, offset);
688 1.1 dholland
689 1.1 dholland /* Remove the hash entry. */
690 1.3 dholland ulfsdirhash_delslot(dh, slot);
691 1.1 dholland
692 1.1 dholland /* Update the per-block summary info. */
693 1.5 dholland ulfsdirhash_adjfree(dh, offset, LFS_DIRSIZ(0, dirp, needswap), dirblksiz);
694 1.1 dholland DIRHASH_UNLOCK(dh);
695 1.1 dholland }
696 1.1 dholland
697 1.1 dholland /*
698 1.1 dholland * Change the offset associated with a directory entry in the hash. Used
699 1.1 dholland * when compacting directory blocks.
700 1.1 dholland */
701 1.1 dholland void
702 1.4 dholland ulfsdirhash_move(struct inode *ip, struct lfs_direct *dirp, doff_t oldoff,
703 1.1 dholland doff_t newoff)
704 1.1 dholland {
705 1.1 dholland struct dirhash *dh;
706 1.1 dholland int slot;
707 1.1 dholland
708 1.1 dholland if ((dh = ip->i_dirhash) == NULL)
709 1.1 dholland return;
710 1.1 dholland DIRHASH_LOCK(dh);
711 1.1 dholland if (dh->dh_hash == NULL) {
712 1.1 dholland DIRHASH_UNLOCK(dh);
713 1.3 dholland ulfsdirhash_free(ip);
714 1.1 dholland return;
715 1.1 dholland }
716 1.1 dholland
717 1.7 dholland KASSERT(oldoff < dh->dh_dirblks * ip->i_lfs->um_dirblksiz &&
718 1.7 dholland newoff < dh->dh_dirblks * ip->i_lfs->um_dirblksiz);
719 1.1 dholland /* Find the entry, and update the offset. */
720 1.3 dholland slot = ulfsdirhash_findslot(dh, dirp->d_name, dirp->d_namlen, oldoff);
721 1.1 dholland DH_ENTRY(dh, slot) = newoff;
722 1.1 dholland DIRHASH_UNLOCK(dh);
723 1.1 dholland }
724 1.1 dholland
725 1.1 dholland /*
726 1.1 dholland * Inform dirhash that the directory has grown by one block that
727 1.1 dholland * begins at offset (i.e. the new length is offset + DIRBLKSIZ).
728 1.1 dholland */
729 1.1 dholland void
730 1.3 dholland ulfsdirhash_newblk(struct inode *ip, doff_t offset)
731 1.1 dholland {
732 1.1 dholland struct dirhash *dh;
733 1.1 dholland int block;
734 1.7 dholland int dirblksiz = ip->i_lfs->um_dirblksiz;
735 1.1 dholland
736 1.1 dholland if ((dh = ip->i_dirhash) == NULL)
737 1.1 dholland return;
738 1.1 dholland DIRHASH_LOCK(dh);
739 1.1 dholland if (dh->dh_hash == NULL) {
740 1.1 dholland DIRHASH_UNLOCK(dh);
741 1.3 dholland ulfsdirhash_free(ip);
742 1.1 dholland return;
743 1.1 dholland }
744 1.1 dholland
745 1.1 dholland KASSERT(offset == dh->dh_dirblks * dirblksiz);
746 1.1 dholland block = offset / dirblksiz;
747 1.1 dholland if (block >= dh->dh_nblk) {
748 1.1 dholland /* Out of space; must rebuild. */
749 1.1 dholland DIRHASH_UNLOCK(dh);
750 1.3 dholland ulfsdirhash_free(ip);
751 1.1 dholland return;
752 1.1 dholland }
753 1.1 dholland dh->dh_dirblks = block + 1;
754 1.1 dholland
755 1.1 dholland /* Account for the new free block. */
756 1.1 dholland dh->dh_blkfree[block] = dirblksiz / DIRALIGN;
757 1.1 dholland if (dh->dh_firstfree[DH_NFSTATS] == -1)
758 1.1 dholland dh->dh_firstfree[DH_NFSTATS] = block;
759 1.1 dholland DIRHASH_UNLOCK(dh);
760 1.1 dholland }
761 1.1 dholland
762 1.1 dholland /*
763 1.1 dholland * Inform dirhash that the directory is being truncated.
764 1.1 dholland */
765 1.1 dholland void
766 1.3 dholland ulfsdirhash_dirtrunc(struct inode *ip, doff_t offset)
767 1.1 dholland {
768 1.1 dholland struct dirhash *dh;
769 1.1 dholland int block, i;
770 1.7 dholland int dirblksiz = ip->i_lfs->um_dirblksiz;
771 1.1 dholland
772 1.1 dholland if ((dh = ip->i_dirhash) == NULL)
773 1.1 dholland return;
774 1.1 dholland
775 1.1 dholland DIRHASH_LOCK(dh);
776 1.1 dholland if (dh->dh_hash == NULL) {
777 1.1 dholland DIRHASH_UNLOCK(dh);
778 1.3 dholland ulfsdirhash_free(ip);
779 1.1 dholland return;
780 1.1 dholland }
781 1.1 dholland
782 1.1 dholland KASSERT(offset <= dh->dh_dirblks * dirblksiz);
783 1.1 dholland block = howmany(offset, dirblksiz);
784 1.1 dholland /*
785 1.1 dholland * If the directory shrinks to less than 1/8 of dh_nblk blocks
786 1.1 dholland * (about 20% of its original size due to the 50% extra added in
787 1.3 dholland * ulfsdirhash_build) then free it, and let the caller rebuild
788 1.1 dholland * if necessary.
789 1.1 dholland */
790 1.1 dholland if (block < dh->dh_nblk / 8 && dh->dh_narrays > 1) {
791 1.1 dholland DIRHASH_UNLOCK(dh);
792 1.3 dholland ulfsdirhash_free(ip);
793 1.1 dholland return;
794 1.1 dholland }
795 1.1 dholland
796 1.1 dholland /*
797 1.1 dholland * Remove any `first free' information pertaining to the
798 1.1 dholland * truncated blocks. All blocks we're removing should be
799 1.1 dholland * completely unused.
800 1.1 dholland */
801 1.1 dholland if (dh->dh_firstfree[DH_NFSTATS] >= block)
802 1.1 dholland dh->dh_firstfree[DH_NFSTATS] = -1;
803 1.1 dholland for (i = block; i < dh->dh_dirblks; i++)
804 1.1 dholland if (dh->dh_blkfree[i] != dirblksiz / DIRALIGN)
805 1.3 dholland panic("ulfsdirhash_dirtrunc: blocks in use");
806 1.1 dholland for (i = 0; i < DH_NFSTATS; i++)
807 1.1 dholland if (dh->dh_firstfree[i] >= block)
808 1.3 dholland panic("ulfsdirhash_dirtrunc: first free corrupt");
809 1.1 dholland dh->dh_dirblks = block;
810 1.1 dholland DIRHASH_UNLOCK(dh);
811 1.1 dholland }
812 1.1 dholland
813 1.1 dholland /*
814 1.1 dholland * Debugging function to check that the dirhash information about
815 1.1 dholland * a directory block matches its actual contents. Panics if a mismatch
816 1.1 dholland * is detected.
817 1.1 dholland *
818 1.1 dholland * On entry, `sbuf' should point to the start of an in-core
819 1.1 dholland * DIRBLKSIZ-sized directory block, and `offset' should contain the
820 1.1 dholland * offset from the start of the directory of that block.
821 1.1 dholland */
822 1.1 dholland void
823 1.3 dholland ulfsdirhash_checkblock(struct inode *ip, char *sbuf, doff_t offset)
824 1.1 dholland {
825 1.1 dholland struct dirhash *dh;
826 1.4 dholland struct lfs_direct *dp;
827 1.1 dholland int block, ffslot, i, nfree;
828 1.7 dholland const int needswap = ULFS_IPNEEDSWAP(ip);
829 1.7 dholland int dirblksiz = ip->i_lfs->um_dirblksiz;
830 1.1 dholland
831 1.3 dholland if (!ulfs_dirhashcheck)
832 1.1 dholland return;
833 1.1 dholland if ((dh = ip->i_dirhash) == NULL)
834 1.1 dholland return;
835 1.1 dholland
836 1.1 dholland DIRHASH_LOCK(dh);
837 1.1 dholland if (dh->dh_hash == NULL) {
838 1.1 dholland DIRHASH_UNLOCK(dh);
839 1.3 dholland ulfsdirhash_free(ip);
840 1.1 dholland return;
841 1.1 dholland }
842 1.1 dholland
843 1.1 dholland block = offset / dirblksiz;
844 1.1 dholland if ((offset & (dirblksiz - 1)) != 0 || block >= dh->dh_dirblks)
845 1.3 dholland panic("ulfsdirhash_checkblock: bad offset");
846 1.1 dholland
847 1.1 dholland nfree = 0;
848 1.1 dholland for (i = 0; i < dirblksiz; i += dp->d_reclen) {
849 1.4 dholland dp = (struct lfs_direct *)(sbuf + i);
850 1.1 dholland if (dp->d_reclen == 0 || i + dp->d_reclen > dirblksiz)
851 1.3 dholland panic("ulfsdirhash_checkblock: bad dir");
852 1.1 dholland
853 1.1 dholland if (dp->d_ino == 0) {
854 1.1 dholland #if 0
855 1.1 dholland /*
856 1.1 dholland * XXX entries with d_ino == 0 should only occur
857 1.1 dholland * at the start of a DIRBLKSIZ block. However the
858 1.3 dholland * ulfs code is tolerant of such entries at other
859 1.1 dholland * offsets, and fsck does not fix them.
860 1.1 dholland */
861 1.1 dholland if (i != 0)
862 1.3 dholland panic("ulfsdirhash_checkblock: bad dir inode");
863 1.1 dholland #endif
864 1.1 dholland nfree += dp->d_reclen;
865 1.1 dholland continue;
866 1.1 dholland }
867 1.1 dholland
868 1.1 dholland /* Check that the entry exists (will panic if it doesn't). */
869 1.3 dholland ulfsdirhash_findslot(dh, dp->d_name, dp->d_namlen, offset + i);
870 1.1 dholland
871 1.5 dholland nfree += dp->d_reclen - LFS_DIRSIZ(0, dp, needswap);
872 1.1 dholland }
873 1.1 dholland if (i != dirblksiz)
874 1.3 dholland panic("ulfsdirhash_checkblock: bad dir end");
875 1.1 dholland
876 1.1 dholland if (dh->dh_blkfree[block] * DIRALIGN != nfree)
877 1.3 dholland panic("ulfsdirhash_checkblock: bad free count");
878 1.1 dholland
879 1.1 dholland ffslot = BLKFREE2IDX(nfree / DIRALIGN);
880 1.1 dholland for (i = 0; i <= DH_NFSTATS; i++)
881 1.1 dholland if (dh->dh_firstfree[i] == block && i != ffslot)
882 1.3 dholland panic("ulfsdirhash_checkblock: bad first-free");
883 1.1 dholland if (dh->dh_firstfree[ffslot] == -1)
884 1.3 dholland panic("ulfsdirhash_checkblock: missing first-free entry");
885 1.1 dholland DIRHASH_UNLOCK(dh);
886 1.1 dholland }
887 1.1 dholland
888 1.1 dholland /*
889 1.1 dholland * Hash the specified filename into a dirhash slot.
890 1.1 dholland */
891 1.1 dholland static int
892 1.3 dholland ulfsdirhash_hash(struct dirhash *dh, const char *name, int namelen)
893 1.1 dholland {
894 1.1 dholland u_int32_t hash;
895 1.1 dholland
896 1.1 dholland /*
897 1.1 dholland * We hash the name and then some other bit of data that is
898 1.1 dholland * invariant over the dirhash's lifetime. Otherwise names
899 1.1 dholland * differing only in the last byte are placed close to one
900 1.1 dholland * another in the table, which is bad for linear probing.
901 1.1 dholland */
902 1.1 dholland hash = hash32_buf(name, namelen, HASH32_BUF_INIT);
903 1.1 dholland hash = hash32_buf(&dh, sizeof(dh), hash);
904 1.1 dholland return (hash % dh->dh_hlen);
905 1.1 dholland }
906 1.1 dholland
907 1.1 dholland /*
908 1.1 dholland * Adjust the number of free bytes in the block containing `offset'
909 1.1 dholland * by the value specified by `diff'.
910 1.1 dholland *
911 1.1 dholland * The caller must ensure we have exclusive access to `dh'; normally
912 1.1 dholland * that means that dh_lock should be held, but this is also called
913 1.3 dholland * from ulfsdirhash_build() where exclusive access can be assumed.
914 1.1 dholland */
915 1.1 dholland static void
916 1.3 dholland ulfsdirhash_adjfree(struct dirhash *dh, doff_t offset, int diff, int dirblksiz)
917 1.1 dholland {
918 1.1 dholland int block, i, nfidx, ofidx;
919 1.1 dholland
920 1.1 dholland KASSERT(mutex_owned(&dh->dh_lock));
921 1.1 dholland
922 1.1 dholland /* Update the per-block summary info. */
923 1.1 dholland block = offset / dirblksiz;
924 1.1 dholland KASSERT(block < dh->dh_nblk && block < dh->dh_dirblks);
925 1.1 dholland ofidx = BLKFREE2IDX(dh->dh_blkfree[block]);
926 1.1 dholland dh->dh_blkfree[block] = (int)dh->dh_blkfree[block] + (diff / DIRALIGN);
927 1.1 dholland nfidx = BLKFREE2IDX(dh->dh_blkfree[block]);
928 1.1 dholland
929 1.1 dholland /* Update the `first free' list if necessary. */
930 1.1 dholland if (ofidx != nfidx) {
931 1.1 dholland /* If removing, scan forward for the next block. */
932 1.1 dholland if (dh->dh_firstfree[ofidx] == block) {
933 1.1 dholland for (i = block + 1; i < dh->dh_dirblks; i++)
934 1.1 dholland if (BLKFREE2IDX(dh->dh_blkfree[i]) == ofidx)
935 1.1 dholland break;
936 1.1 dholland dh->dh_firstfree[ofidx] = (i < dh->dh_dirblks) ? i : -1;
937 1.1 dholland }
938 1.1 dholland
939 1.1 dholland /* Make this the new `first free' if necessary */
940 1.1 dholland if (dh->dh_firstfree[nfidx] > block ||
941 1.1 dholland dh->dh_firstfree[nfidx] == -1)
942 1.1 dholland dh->dh_firstfree[nfidx] = block;
943 1.1 dholland }
944 1.1 dholland }
945 1.1 dholland
946 1.1 dholland /*
947 1.1 dholland * Find the specified name which should have the specified offset.
948 1.1 dholland * Returns a slot number, and panics on failure.
949 1.1 dholland *
950 1.1 dholland * `dh' must be locked on entry and remains so on return.
951 1.1 dholland */
952 1.1 dholland static int
953 1.3 dholland ulfsdirhash_findslot(struct dirhash *dh, const char *name, int namelen,
954 1.1 dholland doff_t offset)
955 1.1 dholland {
956 1.1 dholland int slot;
957 1.1 dholland
958 1.1 dholland KASSERT(mutex_owned(&dh->dh_lock));
959 1.1 dholland
960 1.1 dholland /* Find the entry. */
961 1.1 dholland KASSERT(dh->dh_hused < dh->dh_hlen);
962 1.3 dholland slot = ulfsdirhash_hash(dh, name, namelen);
963 1.1 dholland while (DH_ENTRY(dh, slot) != offset &&
964 1.1 dholland DH_ENTRY(dh, slot) != DIRHASH_EMPTY)
965 1.1 dholland slot = WRAPINCR(slot, dh->dh_hlen);
966 1.1 dholland if (DH_ENTRY(dh, slot) != offset)
967 1.3 dholland panic("ulfsdirhash_findslot: '%.*s' not found", namelen, name);
968 1.1 dholland
969 1.1 dholland return (slot);
970 1.1 dholland }
971 1.1 dholland
972 1.1 dholland /*
973 1.1 dholland * Remove the entry corresponding to the specified slot from the hash array.
974 1.1 dholland *
975 1.1 dholland * `dh' must be locked on entry and remains so on return.
976 1.1 dholland */
977 1.1 dholland static void
978 1.3 dholland ulfsdirhash_delslot(struct dirhash *dh, int slot)
979 1.1 dholland {
980 1.1 dholland int i;
981 1.1 dholland
982 1.1 dholland KASSERT(mutex_owned(&dh->dh_lock));
983 1.1 dholland
984 1.1 dholland /* Mark the entry as deleted. */
985 1.1 dholland DH_ENTRY(dh, slot) = DIRHASH_DEL;
986 1.1 dholland
987 1.1 dholland /* If this is the end of a chain of DIRHASH_DEL slots, remove them. */
988 1.1 dholland for (i = slot; DH_ENTRY(dh, i) == DIRHASH_DEL; )
989 1.1 dholland i = WRAPINCR(i, dh->dh_hlen);
990 1.1 dholland if (DH_ENTRY(dh, i) == DIRHASH_EMPTY) {
991 1.1 dholland i = WRAPDECR(i, dh->dh_hlen);
992 1.1 dholland while (DH_ENTRY(dh, i) == DIRHASH_DEL) {
993 1.1 dholland DH_ENTRY(dh, i) = DIRHASH_EMPTY;
994 1.1 dholland dh->dh_hused--;
995 1.1 dholland i = WRAPDECR(i, dh->dh_hlen);
996 1.1 dholland }
997 1.1 dholland KASSERT(dh->dh_hused >= 0);
998 1.1 dholland }
999 1.1 dholland }
1000 1.1 dholland
1001 1.1 dholland /*
1002 1.1 dholland * Given a directory entry and its offset, find the offset of the
1003 1.1 dholland * previous entry in the same DIRBLKSIZ-sized block. Returns an
1004 1.1 dholland * offset, or -1 if there is no previous entry in the block or some
1005 1.1 dholland * other problem occurred.
1006 1.1 dholland */
1007 1.1 dholland static doff_t
1008 1.4 dholland ulfsdirhash_getprev(struct lfs_direct *dirp, doff_t offset, int dirblksiz)
1009 1.1 dholland {
1010 1.4 dholland struct lfs_direct *dp;
1011 1.1 dholland char *blkbuf;
1012 1.1 dholland doff_t blkoff, prevoff;
1013 1.1 dholland int entrypos, i;
1014 1.1 dholland
1015 1.1 dholland blkoff = offset & ~(dirblksiz - 1); /* offset of start of block */
1016 1.1 dholland entrypos = offset & (dirblksiz - 1); /* entry relative to block */
1017 1.1 dholland blkbuf = (char *)dirp - entrypos;
1018 1.1 dholland prevoff = blkoff;
1019 1.1 dholland
1020 1.1 dholland /* If `offset' is the start of a block, there is no previous entry. */
1021 1.1 dholland if (entrypos == 0)
1022 1.1 dholland return (-1);
1023 1.1 dholland
1024 1.1 dholland /* Scan from the start of the block until we get to the entry. */
1025 1.1 dholland for (i = 0; i < entrypos; i += dp->d_reclen) {
1026 1.4 dholland dp = (struct lfs_direct *)(blkbuf + i);
1027 1.1 dholland if (dp->d_reclen == 0 || i + dp->d_reclen > entrypos)
1028 1.1 dholland return (-1); /* Corrupted directory. */
1029 1.1 dholland prevoff = blkoff + i;
1030 1.1 dholland }
1031 1.1 dholland return (prevoff);
1032 1.1 dholland }
1033 1.1 dholland
1034 1.1 dholland /*
1035 1.1 dholland * Try to free up `wanted' bytes by stealing memory from existing
1036 1.1 dholland * dirhashes. Returns zero with list locked if successful.
1037 1.1 dholland */
1038 1.1 dholland static int
1039 1.3 dholland ulfsdirhash_recycle(int wanted)
1040 1.1 dholland {
1041 1.1 dholland struct dirhash *dh;
1042 1.1 dholland doff_t **hash;
1043 1.1 dholland u_int8_t *blkfree;
1044 1.1 dholland int i, mem, narrays;
1045 1.1 dholland size_t hashsz, blkfreesz;
1046 1.1 dholland
1047 1.1 dholland DIRHASHLIST_LOCK();
1048 1.3 dholland while (wanted + ulfs_dirhashmem > ulfs_dirhashmaxmem) {
1049 1.1 dholland /* Find a dirhash, and lock it. */
1050 1.3 dholland if ((dh = TAILQ_FIRST(&ulfsdirhash_list)) == NULL) {
1051 1.1 dholland DIRHASHLIST_UNLOCK();
1052 1.1 dholland return (-1);
1053 1.1 dholland }
1054 1.1 dholland DIRHASH_LOCK(dh);
1055 1.1 dholland KASSERT(dh->dh_hash != NULL);
1056 1.1 dholland
1057 1.1 dholland /* Decrement the score; only recycle if it becomes zero. */
1058 1.1 dholland if (--dh->dh_score > 0) {
1059 1.1 dholland DIRHASH_UNLOCK(dh);
1060 1.1 dholland DIRHASHLIST_UNLOCK();
1061 1.1 dholland return (-1);
1062 1.1 dholland }
1063 1.1 dholland
1064 1.1 dholland /* Remove it from the list and detach its memory. */
1065 1.3 dholland TAILQ_REMOVE(&ulfsdirhash_list, dh, dh_list);
1066 1.1 dholland dh->dh_onlist = 0;
1067 1.1 dholland hash = dh->dh_hash;
1068 1.1 dholland hashsz = dh->dh_hashsz;
1069 1.1 dholland dh->dh_hash = NULL;
1070 1.1 dholland blkfree = dh->dh_blkfree;
1071 1.1 dholland blkfreesz = dh->dh_blkfreesz;
1072 1.1 dholland dh->dh_blkfree = NULL;
1073 1.1 dholland narrays = dh->dh_narrays;
1074 1.1 dholland mem = narrays * sizeof(*dh->dh_hash) +
1075 1.1 dholland narrays * DH_NBLKOFF * sizeof(**dh->dh_hash) +
1076 1.1 dholland dh->dh_nblk * sizeof(*dh->dh_blkfree);
1077 1.1 dholland
1078 1.1 dholland /* Unlock everything, free the detached memory. */
1079 1.1 dholland DIRHASH_UNLOCK(dh);
1080 1.1 dholland DIRHASHLIST_UNLOCK();
1081 1.1 dholland
1082 1.1 dholland for (i = 0; i < narrays; i++)
1083 1.1 dholland DIRHASH_BLKFREE(hash[i]);
1084 1.1 dholland kmem_free(hash, hashsz);
1085 1.1 dholland kmem_free(blkfree, blkfreesz);
1086 1.1 dholland
1087 1.1 dholland /* Account for the returned memory, and repeat if necessary. */
1088 1.1 dholland DIRHASHLIST_LOCK();
1089 1.3 dholland atomic_add_int(&ulfs_dirhashmem, -mem);
1090 1.1 dholland }
1091 1.1 dholland /* Success. */
1092 1.1 dholland return (0);
1093 1.1 dholland }
1094 1.1 dholland
1095 1.1 dholland static void
1096 1.3 dholland ulfsdirhash_sysctl_init(void)
1097 1.1 dholland {
1098 1.1 dholland const struct sysctlnode *rnode, *cnode;
1099 1.1 dholland
1100 1.3 dholland sysctl_createv(&ulfsdirhash_sysctl_log, 0, NULL, &rnode,
1101 1.1 dholland CTLFLAG_PERMANENT,
1102 1.3 dholland CTLTYPE_NODE, "ulfs",
1103 1.3 dholland SYSCTL_DESCR("ulfs"),
1104 1.1 dholland NULL, 0, NULL, 0,
1105 1.8 pooka CTL_VFS, CTL_CREATE, CTL_EOL);
1106 1.1 dholland
1107 1.3 dholland sysctl_createv(&ulfsdirhash_sysctl_log, 0, &rnode, &rnode,
1108 1.1 dholland CTLFLAG_PERMANENT,
1109 1.1 dholland CTLTYPE_NODE, "dirhash",
1110 1.1 dholland SYSCTL_DESCR("dirhash"),
1111 1.1 dholland NULL, 0, NULL, 0,
1112 1.1 dholland CTL_CREATE, CTL_EOL);
1113 1.1 dholland
1114 1.3 dholland sysctl_createv(&ulfsdirhash_sysctl_log, 0, &rnode, &cnode,
1115 1.1 dholland CTLFLAG_PERMANENT|CTLFLAG_READWRITE,
1116 1.1 dholland CTLTYPE_INT, "minblocks",
1117 1.1 dholland SYSCTL_DESCR("minimum hashed directory size in blocks"),
1118 1.3 dholland NULL, 0, &ulfs_dirhashminblks, 0,
1119 1.1 dholland CTL_CREATE, CTL_EOL);
1120 1.1 dholland
1121 1.3 dholland sysctl_createv(&ulfsdirhash_sysctl_log, 0, &rnode, &cnode,
1122 1.1 dholland CTLFLAG_PERMANENT|CTLFLAG_READWRITE,
1123 1.1 dholland CTLTYPE_INT, "maxmem",
1124 1.1 dholland SYSCTL_DESCR("maximum dirhash memory usage"),
1125 1.3 dholland NULL, 0, &ulfs_dirhashmaxmem, 0,
1126 1.1 dholland CTL_CREATE, CTL_EOL);
1127 1.1 dholland
1128 1.3 dholland sysctl_createv(&ulfsdirhash_sysctl_log, 0, &rnode, &cnode,
1129 1.1 dholland CTLFLAG_PERMANENT|CTLFLAG_READONLY,
1130 1.1 dholland CTLTYPE_INT, "memused",
1131 1.1 dholland SYSCTL_DESCR("current dirhash memory usage"),
1132 1.3 dholland NULL, 0, &ulfs_dirhashmem, 0,
1133 1.1 dholland CTL_CREATE, CTL_EOL);
1134 1.1 dholland
1135 1.3 dholland sysctl_createv(&ulfsdirhash_sysctl_log, 0, &rnode, &cnode,
1136 1.1 dholland CTLFLAG_PERMANENT|CTLFLAG_READWRITE,
1137 1.1 dholland CTLTYPE_INT, "docheck",
1138 1.1 dholland SYSCTL_DESCR("enable extra sanity checks"),
1139 1.3 dholland NULL, 0, &ulfs_dirhashcheck, 0,
1140 1.1 dholland CTL_CREATE, CTL_EOL);
1141 1.1 dholland }
1142 1.1 dholland
1143 1.1 dholland void
1144 1.3 dholland ulfsdirhash_init(void)
1145 1.1 dholland {
1146 1.1 dholland
1147 1.3 dholland mutex_init(&ulfsdirhash_lock, MUTEX_DEFAULT, IPL_NONE);
1148 1.3 dholland ulfsdirhashblk_cache = pool_cache_init(DH_NBLKOFF * sizeof(daddr_t), 0,
1149 1.1 dholland 0, 0, "dirhashblk", NULL, IPL_NONE, NULL, NULL, NULL);
1150 1.3 dholland ulfsdirhash_cache = pool_cache_init(sizeof(struct dirhash), 0,
1151 1.1 dholland 0, 0, "dirhash", NULL, IPL_NONE, NULL, NULL, NULL);
1152 1.3 dholland TAILQ_INIT(&ulfsdirhash_list);
1153 1.3 dholland ulfsdirhash_sysctl_init();
1154 1.1 dholland }
1155 1.1 dholland
1156 1.1 dholland void
1157 1.3 dholland ulfsdirhash_done(void)
1158 1.1 dholland {
1159 1.1 dholland
1160 1.3 dholland KASSERT(TAILQ_EMPTY(&ulfsdirhash_list));
1161 1.3 dholland pool_cache_destroy(ulfsdirhashblk_cache);
1162 1.3 dholland pool_cache_destroy(ulfsdirhash_cache);
1163 1.3 dholland mutex_destroy(&ulfsdirhash_lock);
1164 1.3 dholland sysctl_teardown(&ulfsdirhash_sysctl_log);
1165 1.1 dholland }
1166