subr_vmem.c revision 1.36.2.1 1 1.36.2.1 yamt /* $NetBSD: subr_vmem.c,v 1.36.2.1 2007/12/10 12:56:11 yamt Exp $ */
2 1.1 yamt
3 1.1 yamt /*-
4 1.36.2.1 yamt * Copyright (c)2006, 2007 YAMAMOTO Takashi,
5 1.1 yamt * All rights reserved.
6 1.1 yamt *
7 1.1 yamt * Redistribution and use in source and binary forms, with or without
8 1.1 yamt * modification, are permitted provided that the following conditions
9 1.1 yamt * are met:
10 1.1 yamt * 1. Redistributions of source code must retain the above copyright
11 1.1 yamt * notice, this list of conditions and the following disclaimer.
12 1.1 yamt * 2. Redistributions in binary form must reproduce the above copyright
13 1.1 yamt * notice, this list of conditions and the following disclaimer in the
14 1.1 yamt * documentation and/or other materials provided with the distribution.
15 1.1 yamt *
16 1.1 yamt * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
17 1.1 yamt * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
18 1.1 yamt * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
19 1.1 yamt * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
20 1.1 yamt * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
21 1.1 yamt * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
22 1.1 yamt * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
23 1.1 yamt * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
24 1.1 yamt * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
25 1.1 yamt * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
26 1.1 yamt * SUCH DAMAGE.
27 1.1 yamt */
28 1.1 yamt
29 1.1 yamt /*
30 1.1 yamt * reference:
31 1.1 yamt * - Magazines and Vmem: Extending the Slab Allocator
32 1.1 yamt * to Many CPUs and Arbitrary Resources
33 1.1 yamt * http://www.usenix.org/event/usenix01/bonwick.html
34 1.18 yamt *
35 1.18 yamt * todo:
36 1.18 yamt * - decide how to import segments for vmem_xalloc.
37 1.1 yamt */
38 1.1 yamt
39 1.1 yamt #include <sys/cdefs.h>
40 1.36.2.1 yamt __KERNEL_RCSID(0, "$NetBSD: subr_vmem.c,v 1.36.2.1 2007/12/10 12:56:11 yamt Exp $");
41 1.1 yamt
42 1.1 yamt #define VMEM_DEBUG
43 1.5 yamt #if defined(_KERNEL)
44 1.5 yamt #define QCACHE
45 1.5 yamt #endif /* defined(_KERNEL) */
46 1.1 yamt
47 1.1 yamt #include <sys/param.h>
48 1.1 yamt #include <sys/hash.h>
49 1.1 yamt #include <sys/queue.h>
50 1.1 yamt
51 1.1 yamt #if defined(_KERNEL)
52 1.1 yamt #include <sys/systm.h>
53 1.30 yamt #include <sys/kernel.h> /* hz */
54 1.30 yamt #include <sys/callout.h>
55 1.1 yamt #include <sys/lock.h>
56 1.1 yamt #include <sys/once.h>
57 1.1 yamt #include <sys/pool.h>
58 1.3 yamt #include <sys/proc.h>
59 1.1 yamt #include <sys/vmem.h>
60 1.36.2.1 yamt #include <sys/kmem.h>
61 1.30 yamt #include <sys/workqueue.h>
62 1.36.2.1 yamt
63 1.36.2.1 yamt #include <uvm/uvm_extern.h>
64 1.36.2.1 yamt #include <uvm/uvm_map.h>
65 1.36.2.1 yamt #include <uvm/uvm_pdaemon.h>
66 1.1 yamt #else /* defined(_KERNEL) */
67 1.1 yamt #include "../sys/vmem.h"
68 1.1 yamt #endif /* defined(_KERNEL) */
69 1.1 yamt
70 1.1 yamt #if defined(_KERNEL)
71 1.31 ad #define LOCK_DECL(name) kmutex_t name
72 1.1 yamt #else /* defined(_KERNEL) */
73 1.1 yamt #include <errno.h>
74 1.1 yamt #include <assert.h>
75 1.1 yamt #include <stdlib.h>
76 1.1 yamt
77 1.1 yamt #define KASSERT(a) assert(a)
78 1.31 ad #define LOCK_DECL(name) /* nothing */
79 1.31 ad #define mutex_init(a, b, c) /* nothing */
80 1.31 ad #define mutex_destroy(a) /* nothing */
81 1.31 ad #define mutex_enter(a) /* nothing */
82 1.31 ad #define mutex_exit(a) /* nothing */
83 1.31 ad #define mutex_owned(a) /* nothing */
84 1.3 yamt #define ASSERT_SLEEPABLE(lk, msg) /* nothing */
85 1.31 ad #define IPL_VM 0
86 1.1 yamt #endif /* defined(_KERNEL) */
87 1.1 yamt
88 1.1 yamt struct vmem;
89 1.1 yamt struct vmem_btag;
90 1.1 yamt
91 1.1 yamt #if defined(VMEM_DEBUG)
92 1.1 yamt void vmem_dump(const vmem_t *);
93 1.36.2.1 yamt void vmem_dump_seglist(const vmem_t *);
94 1.36.2.1 yamt void vmem_dump_freelist(const vmem_t *);
95 1.36.2.1 yamt #if defined(QCACHE)
96 1.36.2.1 yamt void vmem_dump_qc(const vmem_t *);
97 1.36.2.1 yamt #endif /* defined(QCACHE) */
98 1.1 yamt #endif /* defined(VMEM_DEBUG) */
99 1.1 yamt
100 1.4 yamt #define VMEM_MAXORDER (sizeof(vmem_size_t) * CHAR_BIT)
101 1.30 yamt
102 1.30 yamt #define VMEM_HASHSIZE_MIN 1 /* XXX */
103 1.30 yamt #define VMEM_HASHSIZE_MAX 8192 /* XXX */
104 1.30 yamt #define VMEM_HASHSIZE_INIT VMEM_HASHSIZE_MIN
105 1.1 yamt
106 1.1 yamt #define VM_FITMASK (VM_BESTFIT | VM_INSTANTFIT)
107 1.1 yamt
108 1.36.2.1 yamt /* vm_flag_t (internal uses) */
109 1.36.2.1 yamt #define VM_BTPAGE 0x00008000
110 1.36.2.1 yamt
111 1.1 yamt CIRCLEQ_HEAD(vmem_seglist, vmem_btag);
112 1.1 yamt LIST_HEAD(vmem_freelist, vmem_btag);
113 1.1 yamt LIST_HEAD(vmem_hashlist, vmem_btag);
114 1.36.2.1 yamt typedef struct vmem_hashlist vmem_hashlist_t;
115 1.1 yamt
116 1.5 yamt #if defined(QCACHE)
117 1.5 yamt #define VMEM_QCACHE_IDX_MAX 32
118 1.5 yamt
119 1.5 yamt #define QC_NAME_MAX 16
120 1.5 yamt
121 1.5 yamt struct qcache {
122 1.35 ad pool_cache_t qc_cache;
123 1.5 yamt vmem_t *qc_vmem;
124 1.5 yamt char qc_name[QC_NAME_MAX];
125 1.5 yamt };
126 1.5 yamt typedef struct qcache qcache_t;
127 1.35 ad #define QC_POOL_TO_QCACHE(pool) ((qcache_t *)(pool->pr_qcache))
128 1.5 yamt #endif /* defined(QCACHE) */
129 1.5 yamt
130 1.1 yamt /* vmem arena */
131 1.1 yamt struct vmem {
132 1.31 ad LOCK_DECL(vm_lock);
133 1.36.2.1 yamt vm_flag_t vm_flags;
134 1.36.2.1 yamt int vm_freetags;
135 1.1 yamt vmem_addr_t (*vm_allocfn)(vmem_t *, vmem_size_t, vmem_size_t *,
136 1.1 yamt vm_flag_t);
137 1.1 yamt void (*vm_freefn)(vmem_t *, vmem_addr_t, vmem_size_t);
138 1.1 yamt vmem_t *vm_source;
139 1.1 yamt struct vmem_seglist vm_seglist;
140 1.1 yamt struct vmem_freelist vm_freelist[VMEM_MAXORDER];
141 1.36.2.1 yamt LIST_HEAD(, btpage_header) vm_btpagelist;
142 1.1 yamt size_t vm_hashsize;
143 1.1 yamt size_t vm_nbusytag;
144 1.36.2.1 yamt vmem_hashlist_t *vm_hashlist;
145 1.1 yamt size_t vm_quantum_mask;
146 1.1 yamt int vm_quantum_shift;
147 1.1 yamt const char *vm_name;
148 1.30 yamt LIST_ENTRY(vmem) vm_alllist;
149 1.5 yamt
150 1.5 yamt #if defined(QCACHE)
151 1.5 yamt /* quantum cache */
152 1.5 yamt size_t vm_qcache_max;
153 1.5 yamt struct pool_allocator vm_qcache_allocator;
154 1.22 yamt qcache_t vm_qcache_store[VMEM_QCACHE_IDX_MAX];
155 1.22 yamt qcache_t *vm_qcache[VMEM_QCACHE_IDX_MAX];
156 1.5 yamt #endif /* defined(QCACHE) */
157 1.1 yamt };
158 1.1 yamt
159 1.31 ad #define VMEM_LOCK(vm) mutex_enter(&vm->vm_lock)
160 1.31 ad #define VMEM_TRYLOCK(vm) mutex_tryenter(&vm->vm_lock)
161 1.31 ad #define VMEM_UNLOCK(vm) mutex_exit(&vm->vm_lock)
162 1.36 ad #define VMEM_LOCK_INIT(vm, ipl) mutex_init(&vm->vm_lock, MUTEX_DEFAULT, ipl)
163 1.31 ad #define VMEM_LOCK_DESTROY(vm) mutex_destroy(&vm->vm_lock)
164 1.31 ad #define VMEM_ASSERT_LOCKED(vm) KASSERT(mutex_owned(&vm->vm_lock))
165 1.1 yamt
166 1.36.2.1 yamt #define vmem_bootstrap_p(vm) (((vm)->vm_flags & VMC_KVA) != 0)
167 1.36.2.1 yamt
168 1.1 yamt /* boundary tag */
169 1.1 yamt struct vmem_btag {
170 1.1 yamt CIRCLEQ_ENTRY(vmem_btag) bt_seglist;
171 1.1 yamt union {
172 1.1 yamt LIST_ENTRY(vmem_btag) u_freelist; /* BT_TYPE_FREE */
173 1.1 yamt LIST_ENTRY(vmem_btag) u_hashlist; /* BT_TYPE_BUSY */
174 1.36.2.1 yamt SLIST_ENTRY(vmem_btag) u_sfreelist; /* in btpage_header */
175 1.36.2.1 yamt SLIST_ENTRY(vmem_btag) u_tmplist; /* temp use in vmem_xfree */
176 1.1 yamt } bt_u;
177 1.1 yamt #define bt_hashlist bt_u.u_hashlist
178 1.1 yamt #define bt_freelist bt_u.u_freelist
179 1.36.2.1 yamt #define bt_sfreelist bt_u.u_sfreelist
180 1.36.2.1 yamt #define bt_tmplist bt_u.u_tmplist
181 1.1 yamt vmem_addr_t bt_start;
182 1.1 yamt vmem_size_t bt_size;
183 1.1 yamt int bt_type;
184 1.1 yamt };
185 1.1 yamt
186 1.1 yamt #define BT_TYPE_SPAN 1
187 1.1 yamt #define BT_TYPE_SPAN_STATIC 2
188 1.1 yamt #define BT_TYPE_FREE 3
189 1.1 yamt #define BT_TYPE_BUSY 4
190 1.1 yamt #define BT_ISSPAN_P(bt) ((bt)->bt_type <= BT_TYPE_SPAN_STATIC)
191 1.1 yamt
192 1.1 yamt #define BT_END(bt) ((bt)->bt_start + (bt)->bt_size)
193 1.1 yamt
194 1.1 yamt typedef struct vmem_btag bt_t;
195 1.1 yamt
196 1.1 yamt /* ---- misc */
197 1.1 yamt
198 1.19 yamt #define VMEM_ALIGNUP(addr, align) \
199 1.19 yamt (-(-(addr) & -(align)))
200 1.19 yamt #define VMEM_CROSS_P(addr1, addr2, boundary) \
201 1.19 yamt ((((addr1) ^ (addr2)) & -(boundary)) != 0)
202 1.19 yamt
203 1.4 yamt #define ORDER2SIZE(order) ((vmem_size_t)1 << (order))
204 1.4 yamt
205 1.1 yamt static int
206 1.1 yamt calc_order(vmem_size_t size)
207 1.1 yamt {
208 1.4 yamt vmem_size_t target;
209 1.1 yamt int i;
210 1.1 yamt
211 1.1 yamt KASSERT(size != 0);
212 1.1 yamt
213 1.1 yamt i = 0;
214 1.4 yamt target = size >> 1;
215 1.4 yamt while (ORDER2SIZE(i) <= target) {
216 1.1 yamt i++;
217 1.1 yamt }
218 1.1 yamt
219 1.4 yamt KASSERT(ORDER2SIZE(i) <= size);
220 1.4 yamt KASSERT(size < ORDER2SIZE(i + 1) || ORDER2SIZE(i + 1) < ORDER2SIZE(i));
221 1.1 yamt
222 1.1 yamt return i;
223 1.1 yamt }
224 1.1 yamt
225 1.1 yamt static void *
226 1.1 yamt xmalloc(size_t sz, vm_flag_t flags)
227 1.1 yamt {
228 1.1 yamt
229 1.1 yamt #if defined(_KERNEL)
230 1.36.2.1 yamt return kmem_alloc(sz, (flags & VM_SLEEP) ? KM_SLEEP : KM_NOSLEEP);
231 1.1 yamt #else /* defined(_KERNEL) */
232 1.1 yamt return malloc(sz);
233 1.1 yamt #endif /* defined(_KERNEL) */
234 1.1 yamt }
235 1.1 yamt
236 1.1 yamt static void
237 1.36.2.1 yamt xfree(void *p, size_t sz)
238 1.1 yamt {
239 1.1 yamt
240 1.1 yamt #if defined(_KERNEL)
241 1.36.2.1 yamt kmem_free(p, sz);
242 1.1 yamt #else /* defined(_KERNEL) */
243 1.1 yamt return free(p);
244 1.1 yamt #endif /* defined(_KERNEL) */
245 1.1 yamt }
246 1.1 yamt
247 1.36.2.1 yamt /* ---- static storage for bootstrap */
248 1.36.2.1 yamt
249 1.36.2.1 yamt #define STATIC_POOL_NAME(type) static_ ## type
250 1.36.2.1 yamt #define STATIC_POOL_IDX(type) static_ ## type ## _idx
251 1.36.2.1 yamt #define STATIC_POOL_DEFINE(type, n) \
252 1.36.2.1 yamt type STATIC_POOL_NAME(type)[(n)] __unused ; \
253 1.36.2.1 yamt int STATIC_POOL_IDX(type) __unused
254 1.36.2.1 yamt #define STATIC_POOL_ALLOC(var, type) \
255 1.36.2.1 yamt (var) = &STATIC_POOL_NAME(type)[STATIC_POOL_IDX(type)++]; \
256 1.36.2.1 yamt KASSERT(STATIC_POOL_ELEM_P(type, var))
257 1.36.2.1 yamt #define STATIC_POOL_FREE(type, var) \
258 1.36.2.1 yamt KASSERT(STATIC_POOL_ELEM_P(type, var)); \
259 1.36.2.1 yamt KASSERT((var) == &STATIC_POOL_NAME(type)[STATIC_POOL_IDX(type)-1]); \
260 1.36.2.1 yamt STATIC_POOL_IDX(type)--
261 1.36.2.1 yamt #define STATIC_POOL_ELEM_P(type, var) \
262 1.36.2.1 yamt (&STATIC_POOL_NAME(type)[0] <= (var) && \
263 1.36.2.1 yamt (var) < &STATIC_POOL_NAME(type)[__arraycount(STATIC_POOL_NAME(type))])
264 1.36.2.1 yamt
265 1.36.2.1 yamt static STATIC_POOL_DEFINE(bt_t, 3);
266 1.36.2.1 yamt static STATIC_POOL_DEFINE(vmem_t, 2);
267 1.36.2.1 yamt static STATIC_POOL_DEFINE(vmem_hashlist_t, 2);
268 1.36.2.1 yamt typedef struct pool_cache vmem_pool_cache_t; /* XXX */
269 1.36.2.1 yamt static STATIC_POOL_DEFINE(vmem_pool_cache_t, VMEM_QCACHE_IDX_MAX+1);
270 1.36.2.1 yamt
271 1.1 yamt /* ---- boundary tag */
272 1.1 yamt
273 1.1 yamt #if defined(_KERNEL)
274 1.35 ad static struct pool_cache bt_cache;
275 1.1 yamt #endif /* defined(_KERNEL) */
276 1.1 yamt
277 1.36.2.1 yamt struct btpage_header {
278 1.36.2.1 yamt LIST_ENTRY(btpage_header) bh_q;
279 1.36.2.1 yamt int bh_nfree;
280 1.36.2.1 yamt SLIST_HEAD(, vmem_btag) bh_freelist;
281 1.36.2.1 yamt bt_t bh_bt[];
282 1.36.2.1 yamt };
283 1.36.2.1 yamt typedef struct btpage_header btpage_header_t;
284 1.36.2.1 yamt
285 1.36.2.1 yamt #define BT_PER_PAGE \
286 1.36.2.1 yamt ((PAGE_SIZE - sizeof(btpage_header_t)) / sizeof(bt_t))
287 1.36.2.1 yamt
288 1.36.2.1 yamt static int
289 1.36.2.1 yamt btpage_alloc(vmem_t *vm, vm_flag_t flags)
290 1.36.2.1 yamt {
291 1.36.2.1 yamt vmem_addr_t va;
292 1.36.2.1 yamt
293 1.36.2.1 yamt va = vmem_xalloc(vm, PAGE_SIZE, PAGE_SIZE, 0, 0, 0, 0,
294 1.36.2.1 yamt (flags & ~VM_FITMASK) | VM_INSTANTFIT | VM_BTPAGE);
295 1.36.2.1 yamt if (va == 0) {
296 1.36.2.1 yamt return ENOMEM;
297 1.36.2.1 yamt }
298 1.36.2.1 yamt return 0;
299 1.36.2.1 yamt }
300 1.36.2.1 yamt
301 1.36.2.1 yamt static void
302 1.36.2.1 yamt btpage_init(vmem_t *vm, struct vm_page *pg, vaddr_t va)
303 1.36.2.1 yamt {
304 1.36.2.1 yamt btpage_header_t *bh;
305 1.36.2.1 yamt int i;
306 1.36.2.1 yamt
307 1.36.2.1 yamt VMEM_ASSERT_LOCKED(vm);
308 1.36.2.1 yamt KASSERT((va & PAGE_MASK) == 0);
309 1.36.2.1 yamt pmap_kenter_pa(va, VM_PAGE_TO_PHYS(pg), VM_PROT_READ|VM_PROT_WRITE);
310 1.36.2.1 yamt pmap_update(pmap_kernel());
311 1.36.2.1 yamt bh = (void *)va;
312 1.36.2.1 yamt SLIST_INIT(&bh->bh_freelist);
313 1.36.2.1 yamt for (i = 0; i < BT_PER_PAGE; i++) {
314 1.36.2.1 yamt SLIST_INSERT_HEAD(&bh->bh_freelist, &bh->bh_bt[i],
315 1.36.2.1 yamt bt_sfreelist);
316 1.36.2.1 yamt }
317 1.36.2.1 yamt LIST_INSERT_HEAD(&vm->vm_btpagelist, bh, bh_q);
318 1.36.2.1 yamt bh->bh_nfree = BT_PER_PAGE;
319 1.36.2.1 yamt vm->vm_freetags += bh->bh_nfree;
320 1.36.2.1 yamt }
321 1.36.2.1 yamt
322 1.36.2.1 yamt static void
323 1.36.2.1 yamt btpage_free(vmem_t *vm, btpage_header_t *bh)
324 1.36.2.1 yamt {
325 1.36.2.1 yamt
326 1.36.2.1 yamt KASSERT(vmem_bootstrap_p(vm));
327 1.36.2.1 yamt pmap_kremove((vaddr_t)bh, PAGE_SIZE);
328 1.36.2.1 yamt pmap_update(pmap_kernel());
329 1.36.2.1 yamt vmem_xfree(vm, (vmem_addr_t)bh, PAGE_SIZE);
330 1.36.2.1 yamt }
331 1.36.2.1 yamt
332 1.36.2.1 yamt static btpage_header_t *
333 1.36.2.1 yamt btpage_lookup(bt_t *bt)
334 1.36.2.1 yamt {
335 1.36.2.1 yamt
336 1.36.2.1 yamt return (void *)trunc_page((vaddr_t)bt);
337 1.36.2.1 yamt }
338 1.36.2.1 yamt
339 1.36.2.1 yamt static bt_t *
340 1.36.2.1 yamt bt_alloc_bootstrap(vmem_t *vm)
341 1.36.2.1 yamt {
342 1.36.2.1 yamt btpage_header_t *bh;
343 1.36.2.1 yamt bt_t *bt;
344 1.36.2.1 yamt
345 1.36.2.1 yamt KASSERT(vmem_bootstrap_p(vm));
346 1.36.2.1 yamt VMEM_ASSERT_LOCKED(vm);
347 1.36.2.1 yamt bh = LIST_FIRST(&vm->vm_btpagelist);
348 1.36.2.1 yamt if (__predict_false(bh == NULL)) {
349 1.36.2.1 yamt STATIC_POOL_ALLOC(bt, bt_t);
350 1.36.2.1 yamt return bt;
351 1.36.2.1 yamt }
352 1.36.2.1 yamt KASSERT(bh->bh_nfree > 0);
353 1.36.2.1 yamt bt = SLIST_FIRST(&bh->bh_freelist);
354 1.36.2.1 yamt KASSERT(bt != NULL);
355 1.36.2.1 yamt SLIST_REMOVE_HEAD(&bh->bh_freelist, bt_sfreelist);
356 1.36.2.1 yamt bh->bh_nfree--;
357 1.36.2.1 yamt vm->vm_freetags--;
358 1.36.2.1 yamt if (SLIST_EMPTY(&bh->bh_freelist)) {
359 1.36.2.1 yamt KASSERT(bh->bh_nfree == 0);
360 1.36.2.1 yamt LIST_REMOVE(bh, bh_q);
361 1.36.2.1 yamt }
362 1.36.2.1 yamt return bt;
363 1.36.2.1 yamt }
364 1.36.2.1 yamt
365 1.36.2.1 yamt #define BT_MINRESERVE 1
366 1.36.2.1 yamt
367 1.1 yamt static bt_t *
368 1.17 yamt bt_alloc(vmem_t *vm, vm_flag_t flags)
369 1.1 yamt {
370 1.1 yamt bt_t *bt;
371 1.1 yamt
372 1.1 yamt #if defined(_KERNEL)
373 1.36.2.1 yamt if (vmem_bootstrap_p(vm)) {
374 1.36.2.1 yamt again:
375 1.36.2.1 yamt VMEM_LOCK(vm);
376 1.36.2.1 yamt if (vm->vm_freetags <= BT_MINRESERVE &&
377 1.36.2.1 yamt (flags & VM_BTPAGE) == 0) {
378 1.36.2.1 yamt VMEM_UNLOCK(vm);
379 1.36.2.1 yamt if (btpage_alloc(vm, flags)) {
380 1.36.2.1 yamt return NULL;
381 1.36.2.1 yamt }
382 1.36.2.1 yamt goto again;
383 1.36.2.1 yamt }
384 1.36.2.1 yamt bt = bt_alloc_bootstrap(vm);
385 1.36.2.1 yamt VMEM_UNLOCK(vm);
386 1.36.2.1 yamt } else {
387 1.36.2.1 yamt bt = pool_cache_get(&bt_cache,
388 1.36.2.1 yamt (flags & VM_SLEEP) != 0 ? PR_WAITOK : PR_NOWAIT);
389 1.36.2.1 yamt }
390 1.1 yamt #else /* defined(_KERNEL) */
391 1.1 yamt bt = malloc(sizeof *bt);
392 1.1 yamt #endif /* defined(_KERNEL) */
393 1.1 yamt
394 1.1 yamt return bt;
395 1.1 yamt }
396 1.1 yamt
397 1.1 yamt static void
398 1.17 yamt bt_free(vmem_t *vm, bt_t *bt)
399 1.1 yamt {
400 1.1 yamt
401 1.36.2.1 yamt KASSERT(bt != NULL);
402 1.36.2.1 yamt KASSERT(!STATIC_POOL_ELEM_P(bt_t, bt));
403 1.1 yamt #if defined(_KERNEL)
404 1.36.2.1 yamt if (vmem_bootstrap_p(vm)) {
405 1.36.2.1 yamt btpage_header_t *bh;
406 1.36.2.1 yamt
407 1.36.2.1 yamt bh = btpage_lookup(bt);
408 1.36.2.1 yamt VMEM_LOCK(vm);
409 1.36.2.1 yamt if (SLIST_EMPTY(&bh->bh_freelist)) {
410 1.36.2.1 yamt KASSERT(bh->bh_nfree == 0);
411 1.36.2.1 yamt LIST_INSERT_HEAD(&vm->vm_btpagelist, bh, bh_q);
412 1.36.2.1 yamt }
413 1.36.2.1 yamt SLIST_INSERT_HEAD(&bh->bh_freelist, bt, bt_sfreelist);
414 1.36.2.1 yamt bh->bh_nfree++;
415 1.36.2.1 yamt vm->vm_freetags++;
416 1.36.2.1 yamt if (vm->vm_freetags >= BT_PER_PAGE + BT_MINRESERVE &&
417 1.36.2.1 yamt bh->bh_nfree == BT_PER_PAGE) {
418 1.36.2.1 yamt LIST_REMOVE(bh, bh_q);
419 1.36.2.1 yamt vm->vm_freetags -= BT_PER_PAGE;
420 1.36.2.1 yamt VMEM_UNLOCK(vm);
421 1.36.2.1 yamt btpage_free(vm, bh);
422 1.36.2.1 yamt } else {
423 1.36.2.1 yamt VMEM_UNLOCK(vm);
424 1.36.2.1 yamt }
425 1.36.2.1 yamt } else {
426 1.36.2.1 yamt pool_cache_put(&bt_cache, bt);
427 1.36.2.1 yamt }
428 1.1 yamt #else /* defined(_KERNEL) */
429 1.1 yamt free(bt);
430 1.1 yamt #endif /* defined(_KERNEL) */
431 1.1 yamt }
432 1.1 yamt
433 1.1 yamt /*
434 1.1 yamt * freelist[0] ... [1, 1]
435 1.1 yamt * freelist[1] ... [2, 3]
436 1.1 yamt * freelist[2] ... [4, 7]
437 1.1 yamt * freelist[3] ... [8, 15]
438 1.1 yamt * :
439 1.1 yamt * freelist[n] ... [(1 << n), (1 << (n + 1)) - 1]
440 1.1 yamt * :
441 1.1 yamt */
442 1.1 yamt
443 1.1 yamt static struct vmem_freelist *
444 1.1 yamt bt_freehead_tofree(vmem_t *vm, vmem_size_t size)
445 1.1 yamt {
446 1.1 yamt const vmem_size_t qsize = size >> vm->vm_quantum_shift;
447 1.1 yamt int idx;
448 1.1 yamt
449 1.1 yamt KASSERT((size & vm->vm_quantum_mask) == 0);
450 1.1 yamt KASSERT(size != 0);
451 1.1 yamt
452 1.1 yamt idx = calc_order(qsize);
453 1.1 yamt KASSERT(idx >= 0);
454 1.1 yamt KASSERT(idx < VMEM_MAXORDER);
455 1.1 yamt
456 1.1 yamt return &vm->vm_freelist[idx];
457 1.1 yamt }
458 1.1 yamt
459 1.1 yamt static struct vmem_freelist *
460 1.1 yamt bt_freehead_toalloc(vmem_t *vm, vmem_size_t size, vm_flag_t strat)
461 1.1 yamt {
462 1.1 yamt const vmem_size_t qsize = size >> vm->vm_quantum_shift;
463 1.1 yamt int idx;
464 1.1 yamt
465 1.1 yamt KASSERT((size & vm->vm_quantum_mask) == 0);
466 1.1 yamt KASSERT(size != 0);
467 1.1 yamt
468 1.1 yamt idx = calc_order(qsize);
469 1.4 yamt if (strat == VM_INSTANTFIT && ORDER2SIZE(idx) != qsize) {
470 1.1 yamt idx++;
471 1.1 yamt /* check too large request? */
472 1.1 yamt }
473 1.1 yamt KASSERT(idx >= 0);
474 1.1 yamt KASSERT(idx < VMEM_MAXORDER);
475 1.1 yamt
476 1.1 yamt return &vm->vm_freelist[idx];
477 1.1 yamt }
478 1.1 yamt
479 1.1 yamt /* ---- boundary tag hash */
480 1.1 yamt
481 1.36.2.1 yamt static vmem_hashlist_t *
482 1.1 yamt bt_hashhead(vmem_t *vm, vmem_addr_t addr)
483 1.1 yamt {
484 1.36.2.1 yamt vmem_hashlist_t *list;
485 1.1 yamt unsigned int hash;
486 1.1 yamt
487 1.1 yamt hash = hash32_buf(&addr, sizeof(addr), HASH32_BUF_INIT);
488 1.1 yamt list = &vm->vm_hashlist[hash % vm->vm_hashsize];
489 1.1 yamt
490 1.1 yamt return list;
491 1.1 yamt }
492 1.1 yamt
493 1.1 yamt static bt_t *
494 1.1 yamt bt_lookupbusy(vmem_t *vm, vmem_addr_t addr)
495 1.1 yamt {
496 1.36.2.1 yamt vmem_hashlist_t *list;
497 1.1 yamt bt_t *bt;
498 1.1 yamt
499 1.1 yamt list = bt_hashhead(vm, addr);
500 1.1 yamt LIST_FOREACH(bt, list, bt_hashlist) {
501 1.1 yamt if (bt->bt_start == addr) {
502 1.1 yamt break;
503 1.1 yamt }
504 1.1 yamt }
505 1.1 yamt
506 1.1 yamt return bt;
507 1.1 yamt }
508 1.1 yamt
509 1.1 yamt static void
510 1.1 yamt bt_rembusy(vmem_t *vm, bt_t *bt)
511 1.1 yamt {
512 1.1 yamt
513 1.1 yamt KASSERT(vm->vm_nbusytag > 0);
514 1.1 yamt vm->vm_nbusytag--;
515 1.1 yamt LIST_REMOVE(bt, bt_hashlist);
516 1.1 yamt }
517 1.1 yamt
518 1.1 yamt static void
519 1.1 yamt bt_insbusy(vmem_t *vm, bt_t *bt)
520 1.1 yamt {
521 1.36.2.1 yamt vmem_hashlist_t *list;
522 1.1 yamt
523 1.1 yamt KASSERT(bt->bt_type == BT_TYPE_BUSY);
524 1.1 yamt
525 1.1 yamt list = bt_hashhead(vm, bt->bt_start);
526 1.1 yamt LIST_INSERT_HEAD(list, bt, bt_hashlist);
527 1.1 yamt vm->vm_nbusytag++;
528 1.1 yamt }
529 1.1 yamt
530 1.1 yamt /* ---- boundary tag list */
531 1.1 yamt
532 1.1 yamt static void
533 1.1 yamt bt_remseg(vmem_t *vm, bt_t *bt)
534 1.1 yamt {
535 1.1 yamt
536 1.1 yamt CIRCLEQ_REMOVE(&vm->vm_seglist, bt, bt_seglist);
537 1.1 yamt }
538 1.1 yamt
539 1.1 yamt static void
540 1.1 yamt bt_insseg(vmem_t *vm, bt_t *bt, bt_t *prev)
541 1.1 yamt {
542 1.1 yamt
543 1.1 yamt CIRCLEQ_INSERT_AFTER(&vm->vm_seglist, prev, bt, bt_seglist);
544 1.1 yamt }
545 1.1 yamt
546 1.1 yamt static void
547 1.1 yamt bt_insseg_tail(vmem_t *vm, bt_t *bt)
548 1.1 yamt {
549 1.1 yamt
550 1.1 yamt CIRCLEQ_INSERT_TAIL(&vm->vm_seglist, bt, bt_seglist);
551 1.1 yamt }
552 1.1 yamt
553 1.1 yamt static void
554 1.17 yamt bt_remfree(vmem_t *vm, bt_t *bt)
555 1.1 yamt {
556 1.1 yamt
557 1.1 yamt KASSERT(bt->bt_type == BT_TYPE_FREE);
558 1.1 yamt
559 1.1 yamt LIST_REMOVE(bt, bt_freelist);
560 1.1 yamt }
561 1.1 yamt
562 1.1 yamt static void
563 1.1 yamt bt_insfree(vmem_t *vm, bt_t *bt)
564 1.1 yamt {
565 1.1 yamt struct vmem_freelist *list;
566 1.1 yamt
567 1.1 yamt list = bt_freehead_tofree(vm, bt->bt_size);
568 1.1 yamt LIST_INSERT_HEAD(list, bt, bt_freelist);
569 1.1 yamt }
570 1.1 yamt
571 1.1 yamt /* ---- vmem internal functions */
572 1.1 yamt
573 1.30 yamt #if defined(_KERNEL)
574 1.30 yamt static kmutex_t vmem_list_lock;
575 1.30 yamt static LIST_HEAD(, vmem) vmem_list = LIST_HEAD_INITIALIZER(vmem_list);
576 1.30 yamt #endif /* defined(_KERNEL) */
577 1.30 yamt
578 1.5 yamt #if defined(QCACHE)
579 1.5 yamt static inline vm_flag_t
580 1.5 yamt prf_to_vmf(int prflags)
581 1.5 yamt {
582 1.5 yamt vm_flag_t vmflags;
583 1.5 yamt
584 1.5 yamt KASSERT((prflags & ~(PR_LIMITFAIL | PR_WAITOK | PR_NOWAIT)) == 0);
585 1.5 yamt if ((prflags & PR_WAITOK) != 0) {
586 1.5 yamt vmflags = VM_SLEEP;
587 1.5 yamt } else {
588 1.5 yamt vmflags = VM_NOSLEEP;
589 1.5 yamt }
590 1.5 yamt return vmflags;
591 1.5 yamt }
592 1.5 yamt
593 1.5 yamt static inline int
594 1.5 yamt vmf_to_prf(vm_flag_t vmflags)
595 1.5 yamt {
596 1.5 yamt int prflags;
597 1.5 yamt
598 1.7 yamt if ((vmflags & VM_SLEEP) != 0) {
599 1.5 yamt prflags = PR_WAITOK;
600 1.7 yamt } else {
601 1.5 yamt prflags = PR_NOWAIT;
602 1.5 yamt }
603 1.5 yamt return prflags;
604 1.5 yamt }
605 1.5 yamt
606 1.5 yamt static size_t
607 1.5 yamt qc_poolpage_size(size_t qcache_max)
608 1.5 yamt {
609 1.5 yamt int i;
610 1.5 yamt
611 1.5 yamt for (i = 0; ORDER2SIZE(i) <= qcache_max * 3; i++) {
612 1.5 yamt /* nothing */
613 1.5 yamt }
614 1.5 yamt return ORDER2SIZE(i);
615 1.5 yamt }
616 1.5 yamt
617 1.5 yamt static void *
618 1.5 yamt qc_poolpage_alloc(struct pool *pool, int prflags)
619 1.5 yamt {
620 1.5 yamt qcache_t *qc = QC_POOL_TO_QCACHE(pool);
621 1.5 yamt vmem_t *vm = qc->qc_vmem;
622 1.5 yamt
623 1.5 yamt return (void *)vmem_alloc(vm, pool->pr_alloc->pa_pagesz,
624 1.5 yamt prf_to_vmf(prflags) | VM_INSTANTFIT);
625 1.5 yamt }
626 1.5 yamt
627 1.5 yamt static void
628 1.5 yamt qc_poolpage_free(struct pool *pool, void *addr)
629 1.5 yamt {
630 1.5 yamt qcache_t *qc = QC_POOL_TO_QCACHE(pool);
631 1.5 yamt vmem_t *vm = qc->qc_vmem;
632 1.5 yamt
633 1.5 yamt vmem_free(vm, (vmem_addr_t)addr, pool->pr_alloc->pa_pagesz);
634 1.5 yamt }
635 1.5 yamt
636 1.5 yamt static void
637 1.31 ad qc_init(vmem_t *vm, size_t qcache_max, int ipl)
638 1.5 yamt {
639 1.22 yamt qcache_t *prevqc;
640 1.5 yamt struct pool_allocator *pa;
641 1.5 yamt int qcache_idx_max;
642 1.5 yamt int i;
643 1.5 yamt
644 1.5 yamt KASSERT((qcache_max & vm->vm_quantum_mask) == 0);
645 1.5 yamt if (qcache_max > (VMEM_QCACHE_IDX_MAX << vm->vm_quantum_shift)) {
646 1.5 yamt qcache_max = VMEM_QCACHE_IDX_MAX << vm->vm_quantum_shift;
647 1.5 yamt }
648 1.5 yamt vm->vm_qcache_max = qcache_max;
649 1.5 yamt pa = &vm->vm_qcache_allocator;
650 1.5 yamt memset(pa, 0, sizeof(*pa));
651 1.5 yamt pa->pa_alloc = qc_poolpage_alloc;
652 1.5 yamt pa->pa_free = qc_poolpage_free;
653 1.5 yamt pa->pa_pagesz = qc_poolpage_size(qcache_max);
654 1.5 yamt
655 1.5 yamt qcache_idx_max = qcache_max >> vm->vm_quantum_shift;
656 1.22 yamt prevqc = NULL;
657 1.22 yamt for (i = qcache_idx_max; i > 0; i--) {
658 1.22 yamt qcache_t *qc = &vm->vm_qcache_store[i - 1];
659 1.5 yamt size_t size = i << vm->vm_quantum_shift;
660 1.36.2.1 yamt pool_cache_t pc;
661 1.5 yamt
662 1.5 yamt qc->qc_vmem = vm;
663 1.8 martin snprintf(qc->qc_name, sizeof(qc->qc_name), "%s-%zu",
664 1.5 yamt vm->vm_name, size);
665 1.36.2.1 yamt if (!kmem_running_p()) {
666 1.36.2.1 yamt STATIC_POOL_ALLOC(pc, vmem_pool_cache_t);
667 1.36.2.1 yamt pool_cache_bootstrap(pc, size,
668 1.36.2.1 yamt ORDER2SIZE(vm->vm_quantum_shift), 0,
669 1.36.2.1 yamt PR_NOALIGN | PR_NOTOUCH /* XXX */,
670 1.36.2.1 yamt qc->qc_name, pa, ipl, NULL, NULL, NULL);
671 1.36.2.1 yamt } else {
672 1.36.2.1 yamt pc = pool_cache_init(size,
673 1.36.2.1 yamt ORDER2SIZE(vm->vm_quantum_shift), 0,
674 1.36.2.1 yamt PR_NOALIGN | PR_NOTOUCH /* XXX */,
675 1.36.2.1 yamt qc->qc_name, pa, ipl, NULL, NULL, NULL);
676 1.36.2.1 yamt }
677 1.36.2.1 yamt qc->qc_cache = pc;
678 1.22 yamt if (prevqc != NULL &&
679 1.35 ad qc->qc_cache->pc_pool.pr_itemsperpage ==
680 1.35 ad prevqc->qc_cache->pc_pool.pr_itemsperpage) {
681 1.36.2.1 yamt if (!kmem_running_p()) {
682 1.36.2.1 yamt pool_cache_bootstrap_destroy(pc);
683 1.36.2.1 yamt STATIC_POOL_FREE(vmem_pool_cache_t, pc);
684 1.36.2.1 yamt } else {
685 1.36.2.1 yamt pool_cache_destroy(pc);
686 1.36.2.1 yamt }
687 1.22 yamt vm->vm_qcache[i - 1] = prevqc;
688 1.27 ad continue;
689 1.22 yamt }
690 1.35 ad qc->qc_cache->pc_pool.pr_qcache = qc;
691 1.22 yamt vm->vm_qcache[i - 1] = qc;
692 1.22 yamt prevqc = qc;
693 1.5 yamt }
694 1.5 yamt }
695 1.6 yamt
696 1.23 yamt static void
697 1.23 yamt qc_destroy(vmem_t *vm)
698 1.23 yamt {
699 1.23 yamt const qcache_t *prevqc;
700 1.23 yamt int i;
701 1.23 yamt int qcache_idx_max;
702 1.23 yamt
703 1.36.2.1 yamt KASSERT(!vmem_bootstrap_p(vm));
704 1.23 yamt qcache_idx_max = vm->vm_qcache_max >> vm->vm_quantum_shift;
705 1.23 yamt prevqc = NULL;
706 1.24 yamt for (i = 0; i < qcache_idx_max; i++) {
707 1.24 yamt qcache_t *qc = vm->vm_qcache[i];
708 1.23 yamt
709 1.23 yamt if (prevqc == qc) {
710 1.23 yamt continue;
711 1.23 yamt }
712 1.35 ad pool_cache_destroy(qc->qc_cache);
713 1.23 yamt prevqc = qc;
714 1.23 yamt }
715 1.23 yamt }
716 1.23 yamt
717 1.25 thorpej static bool
718 1.6 yamt qc_reap(vmem_t *vm)
719 1.6 yamt {
720 1.22 yamt const qcache_t *prevqc;
721 1.6 yamt int i;
722 1.6 yamt int qcache_idx_max;
723 1.26 thorpej bool didsomething = false;
724 1.6 yamt
725 1.6 yamt qcache_idx_max = vm->vm_qcache_max >> vm->vm_quantum_shift;
726 1.22 yamt prevqc = NULL;
727 1.24 yamt for (i = 0; i < qcache_idx_max; i++) {
728 1.24 yamt qcache_t *qc = vm->vm_qcache[i];
729 1.6 yamt
730 1.22 yamt if (prevqc == qc) {
731 1.22 yamt continue;
732 1.22 yamt }
733 1.35 ad if (pool_cache_reclaim(qc->qc_cache) != 0) {
734 1.26 thorpej didsomething = true;
735 1.6 yamt }
736 1.22 yamt prevqc = qc;
737 1.6 yamt }
738 1.6 yamt
739 1.6 yamt return didsomething;
740 1.6 yamt }
741 1.5 yamt #endif /* defined(QCACHE) */
742 1.5 yamt
743 1.1 yamt #if defined(_KERNEL)
744 1.1 yamt static int
745 1.1 yamt vmem_init(void)
746 1.1 yamt {
747 1.1 yamt
748 1.30 yamt mutex_init(&vmem_list_lock, MUTEX_DEFAULT, IPL_NONE);
749 1.35 ad pool_cache_bootstrap(&bt_cache, sizeof(bt_t), 0, 0, 0, "vmembt",
750 1.35 ad NULL, IPL_VM, NULL, NULL, NULL);
751 1.1 yamt return 0;
752 1.1 yamt }
753 1.1 yamt #endif /* defined(_KERNEL) */
754 1.1 yamt
755 1.1 yamt static vmem_addr_t
756 1.1 yamt vmem_add1(vmem_t *vm, vmem_addr_t addr, vmem_size_t size, vm_flag_t flags,
757 1.1 yamt int spanbttype)
758 1.1 yamt {
759 1.1 yamt bt_t *btspan;
760 1.1 yamt bt_t *btfree;
761 1.1 yamt
762 1.1 yamt KASSERT((flags & (VM_SLEEP|VM_NOSLEEP)) != 0);
763 1.1 yamt KASSERT((~flags & (VM_SLEEP|VM_NOSLEEP)) != 0);
764 1.1 yamt
765 1.36.2.1 yamt if ((flags & VMC_KVA) != 0) {
766 1.36.2.1 yamt KASSERT(vmem_bootstrap_p(vm));
767 1.36.2.1 yamt KASSERT(CIRCLEQ_EMPTY(&vm->vm_seglist));
768 1.36.2.1 yamt STATIC_POOL_ALLOC(btspan, bt_t);
769 1.36.2.1 yamt STATIC_POOL_ALLOC(btfree, bt_t);
770 1.36.2.1 yamt } else {
771 1.36.2.1 yamt btspan = bt_alloc(vm, flags);
772 1.36.2.1 yamt if (btspan == NULL) {
773 1.36.2.1 yamt return VMEM_ADDR_NULL;
774 1.36.2.1 yamt }
775 1.36.2.1 yamt btfree = bt_alloc(vm, flags);
776 1.36.2.1 yamt if (btfree == NULL) {
777 1.36.2.1 yamt bt_free(vm, btspan);
778 1.36.2.1 yamt return VMEM_ADDR_NULL;
779 1.36.2.1 yamt }
780 1.1 yamt }
781 1.1 yamt
782 1.1 yamt btspan->bt_type = spanbttype;
783 1.1 yamt btspan->bt_start = addr;
784 1.1 yamt btspan->bt_size = size;
785 1.1 yamt
786 1.1 yamt btfree->bt_type = BT_TYPE_FREE;
787 1.1 yamt btfree->bt_start = addr;
788 1.1 yamt btfree->bt_size = size;
789 1.1 yamt
790 1.1 yamt VMEM_LOCK(vm);
791 1.1 yamt bt_insseg_tail(vm, btspan);
792 1.1 yamt bt_insseg(vm, btfree, btspan);
793 1.1 yamt bt_insfree(vm, btfree);
794 1.1 yamt VMEM_UNLOCK(vm);
795 1.1 yamt
796 1.36.2.1 yamt if ((flags & VMC_KVA) != 0) {
797 1.36.2.1 yamt bt_t *bt;
798 1.36.2.1 yamt
799 1.36.2.1 yamt /*
800 1.36.2.1 yamt * leak a bt.
801 1.36.2.1 yamt * this ensure that
802 1.36.2.1 yamt */
803 1.36.2.1 yamt
804 1.36.2.1 yamt bt = bt_alloc(vm, VM_NOSLEEP);
805 1.36.2.1 yamt KASSERT(bt != NULL);
806 1.36.2.1 yamt
807 1.36.2.1 yamt /*
808 1.36.2.1 yamt * don't leave "btfree" on the segment list because
809 1.36.2.1 yamt * bt_free() doesn't expect static tags.
810 1.36.2.1 yamt */
811 1.36.2.1 yamt
812 1.36.2.1 yamt bt = bt_alloc(vm, flags);
813 1.36.2.1 yamt VMEM_LOCK(vm);
814 1.36.2.1 yamt KASSERT(vm->vm_nbusytag == 1);
815 1.36.2.1 yamt bt->bt_start = btfree->bt_start;
816 1.36.2.1 yamt bt->bt_size = btfree->bt_size;
817 1.36.2.1 yamt bt->bt_type = btfree->bt_type;
818 1.36.2.1 yamt bt_insfree(vm, bt);
819 1.36.2.1 yamt bt_insseg(vm, bt, btfree);
820 1.36.2.1 yamt bt_remseg(vm, btfree);
821 1.36.2.1 yamt bt_remfree(vm, btfree);
822 1.36.2.1 yamt VMEM_UNLOCK(vm);
823 1.36.2.1 yamt }
824 1.36.2.1 yamt
825 1.1 yamt return addr;
826 1.1 yamt }
827 1.1 yamt
828 1.30 yamt static void
829 1.30 yamt vmem_destroy1(vmem_t *vm)
830 1.30 yamt {
831 1.30 yamt
832 1.36.2.1 yamt KASSERT(!vmem_bootstrap_p(vm));
833 1.36.2.1 yamt
834 1.30 yamt #if defined(QCACHE)
835 1.30 yamt qc_destroy(vm);
836 1.30 yamt #endif /* defined(QCACHE) */
837 1.30 yamt if (vm->vm_hashlist != NULL) {
838 1.30 yamt int i;
839 1.30 yamt
840 1.30 yamt for (i = 0; i < vm->vm_hashsize; i++) {
841 1.30 yamt bt_t *bt;
842 1.30 yamt
843 1.30 yamt while ((bt = LIST_FIRST(&vm->vm_hashlist[i])) != NULL) {
844 1.30 yamt KASSERT(bt->bt_type == BT_TYPE_SPAN_STATIC);
845 1.30 yamt bt_free(vm, bt);
846 1.30 yamt }
847 1.30 yamt }
848 1.36.2.1 yamt xfree(vm->vm_hashlist,
849 1.36.2.1 yamt sizeof(vmem_hashlist_t *) * vm->vm_hashsize);
850 1.30 yamt }
851 1.31 ad VMEM_LOCK_DESTROY(vm);
852 1.36.2.1 yamt xfree(vm, sizeof(*vm));
853 1.30 yamt }
854 1.30 yamt
855 1.1 yamt static int
856 1.1 yamt vmem_import(vmem_t *vm, vmem_size_t size, vm_flag_t flags)
857 1.1 yamt {
858 1.1 yamt vmem_addr_t addr;
859 1.1 yamt
860 1.1 yamt if (vm->vm_allocfn == NULL) {
861 1.1 yamt return EINVAL;
862 1.1 yamt }
863 1.1 yamt
864 1.1 yamt addr = (*vm->vm_allocfn)(vm->vm_source, size, &size, flags);
865 1.1 yamt if (addr == VMEM_ADDR_NULL) {
866 1.1 yamt return ENOMEM;
867 1.1 yamt }
868 1.1 yamt
869 1.1 yamt if (vmem_add1(vm, addr, size, flags, BT_TYPE_SPAN) == VMEM_ADDR_NULL) {
870 1.1 yamt (*vm->vm_freefn)(vm->vm_source, addr, size);
871 1.1 yamt return ENOMEM;
872 1.1 yamt }
873 1.1 yamt
874 1.1 yamt return 0;
875 1.1 yamt }
876 1.1 yamt
877 1.1 yamt static int
878 1.1 yamt vmem_rehash(vmem_t *vm, size_t newhashsize, vm_flag_t flags)
879 1.1 yamt {
880 1.1 yamt bt_t *bt;
881 1.1 yamt int i;
882 1.36.2.1 yamt vmem_hashlist_t *newhashlist;
883 1.36.2.1 yamt vmem_hashlist_t *oldhashlist;
884 1.1 yamt size_t oldhashsize;
885 1.1 yamt
886 1.1 yamt KASSERT(newhashsize > 0);
887 1.1 yamt
888 1.36.2.1 yamt newhashlist = xmalloc(sizeof(vmem_hashlist_t *) * newhashsize, flags);
889 1.1 yamt if (newhashlist == NULL) {
890 1.1 yamt return ENOMEM;
891 1.1 yamt }
892 1.1 yamt for (i = 0; i < newhashsize; i++) {
893 1.1 yamt LIST_INIT(&newhashlist[i]);
894 1.1 yamt }
895 1.1 yamt
896 1.30 yamt if (!VMEM_TRYLOCK(vm)) {
897 1.36.2.1 yamt xfree(newhashlist, sizeof(vmem_hashlist_t *) * newhashsize);
898 1.30 yamt return EBUSY;
899 1.30 yamt }
900 1.1 yamt oldhashlist = vm->vm_hashlist;
901 1.1 yamt oldhashsize = vm->vm_hashsize;
902 1.1 yamt vm->vm_hashlist = newhashlist;
903 1.1 yamt vm->vm_hashsize = newhashsize;
904 1.1 yamt if (oldhashlist == NULL) {
905 1.1 yamt VMEM_UNLOCK(vm);
906 1.1 yamt return 0;
907 1.1 yamt }
908 1.1 yamt for (i = 0; i < oldhashsize; i++) {
909 1.1 yamt while ((bt = LIST_FIRST(&oldhashlist[i])) != NULL) {
910 1.1 yamt bt_rembusy(vm, bt); /* XXX */
911 1.1 yamt bt_insbusy(vm, bt);
912 1.1 yamt }
913 1.1 yamt }
914 1.1 yamt VMEM_UNLOCK(vm);
915 1.1 yamt
916 1.36.2.1 yamt if (!STATIC_POOL_ELEM_P(vmem_hashlist_t, oldhashlist)) {
917 1.36.2.1 yamt xfree(oldhashlist, sizeof(vmem_hashlist_t *) * oldhashsize);
918 1.36.2.1 yamt }
919 1.1 yamt
920 1.1 yamt return 0;
921 1.1 yamt }
922 1.1 yamt
923 1.10 yamt /*
924 1.10 yamt * vmem_fit: check if a bt can satisfy the given restrictions.
925 1.10 yamt */
926 1.10 yamt
927 1.10 yamt static vmem_addr_t
928 1.10 yamt vmem_fit(const bt_t *bt, vmem_size_t size, vmem_size_t align, vmem_size_t phase,
929 1.10 yamt vmem_size_t nocross, vmem_addr_t minaddr, vmem_addr_t maxaddr)
930 1.10 yamt {
931 1.10 yamt vmem_addr_t start;
932 1.10 yamt vmem_addr_t end;
933 1.10 yamt
934 1.10 yamt KASSERT(bt->bt_size >= size);
935 1.10 yamt
936 1.10 yamt /*
937 1.10 yamt * XXX assumption: vmem_addr_t and vmem_size_t are
938 1.10 yamt * unsigned integer of the same size.
939 1.10 yamt */
940 1.10 yamt
941 1.10 yamt start = bt->bt_start;
942 1.10 yamt if (start < minaddr) {
943 1.10 yamt start = minaddr;
944 1.10 yamt }
945 1.10 yamt end = BT_END(bt);
946 1.10 yamt if (end > maxaddr - 1) {
947 1.10 yamt end = maxaddr - 1;
948 1.10 yamt }
949 1.10 yamt if (start >= end) {
950 1.10 yamt return VMEM_ADDR_NULL;
951 1.10 yamt }
952 1.19 yamt
953 1.19 yamt start = VMEM_ALIGNUP(start - phase, align) + phase;
954 1.10 yamt if (start < bt->bt_start) {
955 1.10 yamt start += align;
956 1.10 yamt }
957 1.19 yamt if (VMEM_CROSS_P(start, start + size - 1, nocross)) {
958 1.10 yamt KASSERT(align < nocross);
959 1.19 yamt start = VMEM_ALIGNUP(start - phase, nocross) + phase;
960 1.10 yamt }
961 1.10 yamt if (start < end && end - start >= size) {
962 1.10 yamt KASSERT((start & (align - 1)) == phase);
963 1.19 yamt KASSERT(!VMEM_CROSS_P(start, start + size - 1, nocross));
964 1.10 yamt KASSERT(minaddr <= start);
965 1.10 yamt KASSERT(maxaddr == 0 || start + size <= maxaddr);
966 1.10 yamt KASSERT(bt->bt_start <= start);
967 1.10 yamt KASSERT(start + size <= BT_END(bt));
968 1.10 yamt return start;
969 1.10 yamt }
970 1.10 yamt return VMEM_ADDR_NULL;
971 1.10 yamt }
972 1.10 yamt
973 1.1 yamt /* ---- vmem API */
974 1.1 yamt
975 1.1 yamt /*
976 1.1 yamt * vmem_create: create an arena.
977 1.1 yamt *
978 1.1 yamt * => must not be called from interrupt context.
979 1.1 yamt */
980 1.1 yamt
981 1.1 yamt vmem_t *
982 1.1 yamt vmem_create(const char *name, vmem_addr_t base, vmem_size_t size,
983 1.1 yamt vmem_size_t quantum,
984 1.1 yamt vmem_addr_t (*allocfn)(vmem_t *, vmem_size_t, vmem_size_t *, vm_flag_t),
985 1.1 yamt void (*freefn)(vmem_t *, vmem_addr_t, vmem_size_t),
986 1.31 ad vmem_t *source, vmem_size_t qcache_max, vm_flag_t flags,
987 1.31 ad int ipl)
988 1.1 yamt {
989 1.1 yamt vmem_t *vm;
990 1.1 yamt int i;
991 1.1 yamt #if defined(_KERNEL)
992 1.1 yamt static ONCE_DECL(control);
993 1.1 yamt #endif /* defined(_KERNEL) */
994 1.1 yamt
995 1.1 yamt KASSERT((flags & (VM_SLEEP|VM_NOSLEEP)) != 0);
996 1.1 yamt KASSERT((~flags & (VM_SLEEP|VM_NOSLEEP)) != 0);
997 1.1 yamt
998 1.1 yamt #if defined(_KERNEL)
999 1.1 yamt if (RUN_ONCE(&control, vmem_init)) {
1000 1.1 yamt return NULL;
1001 1.1 yamt }
1002 1.1 yamt #endif /* defined(_KERNEL) */
1003 1.36.2.1 yamt if ((flags & (VMC_KVA|VMC_KMEM)) != 0) {
1004 1.36.2.1 yamt STATIC_POOL_ALLOC(vm, vmem_t);
1005 1.36.2.1 yamt } else {
1006 1.36.2.1 yamt vm = xmalloc(sizeof(*vm), flags);
1007 1.36.2.1 yamt if (vm == NULL) {
1008 1.36.2.1 yamt return NULL;
1009 1.36.2.1 yamt }
1010 1.1 yamt }
1011 1.1 yamt
1012 1.31 ad VMEM_LOCK_INIT(vm, ipl);
1013 1.1 yamt vm->vm_name = name;
1014 1.36.2.1 yamt vm->vm_flags = flags;
1015 1.36.2.1 yamt vm->vm_freetags = 0;
1016 1.1 yamt vm->vm_quantum_mask = quantum - 1;
1017 1.1 yamt vm->vm_quantum_shift = calc_order(quantum);
1018 1.4 yamt KASSERT(ORDER2SIZE(vm->vm_quantum_shift) == quantum);
1019 1.1 yamt vm->vm_allocfn = allocfn;
1020 1.1 yamt vm->vm_freefn = freefn;
1021 1.1 yamt vm->vm_source = source;
1022 1.1 yamt vm->vm_nbusytag = 0;
1023 1.5 yamt #if defined(QCACHE)
1024 1.31 ad qc_init(vm, qcache_max, ipl);
1025 1.5 yamt #endif /* defined(QCACHE) */
1026 1.1 yamt
1027 1.1 yamt CIRCLEQ_INIT(&vm->vm_seglist);
1028 1.1 yamt for (i = 0; i < VMEM_MAXORDER; i++) {
1029 1.1 yamt LIST_INIT(&vm->vm_freelist[i]);
1030 1.1 yamt }
1031 1.1 yamt vm->vm_hashlist = NULL;
1032 1.36.2.1 yamt if ((flags & (VMC_KVA|VMC_KMEM)) != 0) {
1033 1.36.2.1 yamt STATIC_POOL_ALLOC(vm->vm_hashlist, vmem_hashlist_t);
1034 1.36.2.1 yamt LIST_INIT(&vm->vm_hashlist[0]);
1035 1.36.2.1 yamt vm->vm_hashsize = 1;
1036 1.36.2.1 yamt } else if (vmem_rehash(vm, VMEM_HASHSIZE_INIT, flags)) {
1037 1.30 yamt vmem_destroy1(vm);
1038 1.1 yamt return NULL;
1039 1.1 yamt }
1040 1.1 yamt
1041 1.1 yamt if (size != 0) {
1042 1.1 yamt if (vmem_add(vm, base, size, flags) == 0) {
1043 1.30 yamt vmem_destroy1(vm);
1044 1.1 yamt return NULL;
1045 1.1 yamt }
1046 1.1 yamt }
1047 1.1 yamt
1048 1.30 yamt #if defined(_KERNEL)
1049 1.30 yamt mutex_enter(&vmem_list_lock);
1050 1.30 yamt LIST_INSERT_HEAD(&vmem_list, vm, vm_alllist);
1051 1.30 yamt mutex_exit(&vmem_list_lock);
1052 1.30 yamt #endif /* defined(_KERNEL) */
1053 1.30 yamt
1054 1.36.2.1 yamt #if 0
1055 1.36.2.1 yamt if (vmem_bootstrap_p(vm)) {
1056 1.36.2.1 yamt vmem_rehash(vm, VMEM_HASHSIZE_INIT, flags);
1057 1.36.2.1 yamt }
1058 1.36.2.1 yamt #endif
1059 1.36.2.1 yamt
1060 1.1 yamt return vm;
1061 1.1 yamt }
1062 1.1 yamt
1063 1.1 yamt void
1064 1.1 yamt vmem_destroy(vmem_t *vm)
1065 1.1 yamt {
1066 1.1 yamt
1067 1.30 yamt #if defined(_KERNEL)
1068 1.30 yamt mutex_enter(&vmem_list_lock);
1069 1.30 yamt LIST_REMOVE(vm, vm_alllist);
1070 1.30 yamt mutex_exit(&vmem_list_lock);
1071 1.30 yamt #endif /* defined(_KERNEL) */
1072 1.1 yamt
1073 1.30 yamt vmem_destroy1(vm);
1074 1.1 yamt }
1075 1.1 yamt
1076 1.1 yamt vmem_size_t
1077 1.1 yamt vmem_roundup_size(vmem_t *vm, vmem_size_t size)
1078 1.1 yamt {
1079 1.1 yamt
1080 1.1 yamt return (size + vm->vm_quantum_mask) & ~vm->vm_quantum_mask;
1081 1.1 yamt }
1082 1.1 yamt
1083 1.1 yamt /*
1084 1.1 yamt * vmem_alloc:
1085 1.1 yamt *
1086 1.1 yamt * => caller must ensure appropriate spl,
1087 1.1 yamt * if the arena can be accessed from interrupt context.
1088 1.1 yamt */
1089 1.1 yamt
1090 1.1 yamt vmem_addr_t
1091 1.1 yamt vmem_alloc(vmem_t *vm, vmem_size_t size0, vm_flag_t flags)
1092 1.1 yamt {
1093 1.12 yamt const vmem_size_t size __unused = vmem_roundup_size(vm, size0);
1094 1.12 yamt const vm_flag_t strat __unused = flags & VM_FITMASK;
1095 1.1 yamt
1096 1.1 yamt KASSERT((flags & (VM_SLEEP|VM_NOSLEEP)) != 0);
1097 1.1 yamt KASSERT((~flags & (VM_SLEEP|VM_NOSLEEP)) != 0);
1098 1.1 yamt
1099 1.1 yamt KASSERT(size0 > 0);
1100 1.1 yamt KASSERT(size > 0);
1101 1.1 yamt KASSERT(strat == VM_BESTFIT || strat == VM_INSTANTFIT);
1102 1.3 yamt if ((flags & VM_SLEEP) != 0) {
1103 1.16 yamt ASSERT_SLEEPABLE(NULL, __func__);
1104 1.3 yamt }
1105 1.1 yamt
1106 1.5 yamt #if defined(QCACHE)
1107 1.5 yamt if (size <= vm->vm_qcache_max) {
1108 1.5 yamt int qidx = size >> vm->vm_quantum_shift;
1109 1.22 yamt qcache_t *qc = vm->vm_qcache[qidx - 1];
1110 1.5 yamt
1111 1.35 ad return (vmem_addr_t)pool_cache_get(qc->qc_cache,
1112 1.5 yamt vmf_to_prf(flags));
1113 1.5 yamt }
1114 1.5 yamt #endif /* defined(QCACHE) */
1115 1.5 yamt
1116 1.10 yamt return vmem_xalloc(vm, size0, 0, 0, 0, 0, 0, flags);
1117 1.10 yamt }
1118 1.10 yamt
1119 1.10 yamt vmem_addr_t
1120 1.10 yamt vmem_xalloc(vmem_t *vm, vmem_size_t size0, vmem_size_t align, vmem_size_t phase,
1121 1.10 yamt vmem_size_t nocross, vmem_addr_t minaddr, vmem_addr_t maxaddr,
1122 1.10 yamt vm_flag_t flags)
1123 1.10 yamt {
1124 1.10 yamt struct vmem_freelist *list;
1125 1.10 yamt struct vmem_freelist *first;
1126 1.10 yamt struct vmem_freelist *end;
1127 1.10 yamt bt_t *bt;
1128 1.10 yamt bt_t *btnew;
1129 1.10 yamt bt_t *btnew2;
1130 1.10 yamt const vmem_size_t size = vmem_roundup_size(vm, size0);
1131 1.10 yamt vm_flag_t strat = flags & VM_FITMASK;
1132 1.10 yamt vmem_addr_t start;
1133 1.36.2.1 yamt struct vm_page *pg;
1134 1.10 yamt
1135 1.10 yamt KASSERT(size0 > 0);
1136 1.10 yamt KASSERT(size > 0);
1137 1.10 yamt KASSERT(strat == VM_BESTFIT || strat == VM_INSTANTFIT);
1138 1.10 yamt if ((flags & VM_SLEEP) != 0) {
1139 1.16 yamt ASSERT_SLEEPABLE(NULL, __func__);
1140 1.10 yamt }
1141 1.10 yamt KASSERT((align & vm->vm_quantum_mask) == 0);
1142 1.10 yamt KASSERT((align & (align - 1)) == 0);
1143 1.10 yamt KASSERT((phase & vm->vm_quantum_mask) == 0);
1144 1.10 yamt KASSERT((nocross & vm->vm_quantum_mask) == 0);
1145 1.10 yamt KASSERT((nocross & (nocross - 1)) == 0);
1146 1.10 yamt KASSERT((align == 0 && phase == 0) || phase < align);
1147 1.10 yamt KASSERT(nocross == 0 || nocross >= size);
1148 1.10 yamt KASSERT(maxaddr == 0 || minaddr < maxaddr);
1149 1.19 yamt KASSERT(!VMEM_CROSS_P(phase, phase + size - 1, nocross));
1150 1.10 yamt
1151 1.10 yamt if (align == 0) {
1152 1.10 yamt align = vm->vm_quantum_mask + 1;
1153 1.10 yamt }
1154 1.36.2.1 yamt pg = NULL;
1155 1.36.2.1 yamt if ((flags & VM_BTPAGE) != 0) {
1156 1.36.2.1 yamt KASSERT(size == PAGE_SIZE);
1157 1.36.2.1 yamt KASSERT(align == PAGE_SIZE);
1158 1.36.2.1 yamt while (pg == NULL) {
1159 1.36.2.1 yamt pg = uvm_pagealloc(NULL, 0, NULL, 0);
1160 1.36.2.1 yamt if (pg == NULL) {
1161 1.36.2.1 yamt if ((flags & VM_NOSLEEP) != 0) {
1162 1.36.2.1 yamt return ENOMEM;
1163 1.36.2.1 yamt }
1164 1.36.2.1 yamt uvm_wait("btpage");
1165 1.36.2.1 yamt }
1166 1.36.2.1 yamt }
1167 1.36.2.1 yamt btnew = NULL; /* XXX: gcc */
1168 1.36.2.1 yamt btnew2 = NULL;
1169 1.36.2.1 yamt } else {
1170 1.36.2.1 yamt btnew = bt_alloc(vm, flags);
1171 1.36.2.1 yamt if (btnew == NULL) {
1172 1.36.2.1 yamt return VMEM_ADDR_NULL;
1173 1.36.2.1 yamt }
1174 1.36.2.1 yamt /* XXX not necessary if no restrictions */
1175 1.36.2.1 yamt btnew2 = bt_alloc(vm, flags);
1176 1.36.2.1 yamt if (btnew2 == NULL) {
1177 1.36.2.1 yamt bt_free(vm, btnew);
1178 1.36.2.1 yamt return VMEM_ADDR_NULL;
1179 1.36.2.1 yamt }
1180 1.10 yamt }
1181 1.1 yamt
1182 1.1 yamt retry_strat:
1183 1.1 yamt first = bt_freehead_toalloc(vm, size, strat);
1184 1.1 yamt end = &vm->vm_freelist[VMEM_MAXORDER];
1185 1.1 yamt retry:
1186 1.1 yamt bt = NULL;
1187 1.1 yamt VMEM_LOCK(vm);
1188 1.2 yamt if (strat == VM_INSTANTFIT) {
1189 1.2 yamt for (list = first; list < end; list++) {
1190 1.2 yamt bt = LIST_FIRST(list);
1191 1.2 yamt if (bt != NULL) {
1192 1.10 yamt start = vmem_fit(bt, size, align, phase,
1193 1.10 yamt nocross, minaddr, maxaddr);
1194 1.10 yamt if (start != VMEM_ADDR_NULL) {
1195 1.10 yamt goto gotit;
1196 1.10 yamt }
1197 1.2 yamt }
1198 1.2 yamt }
1199 1.2 yamt } else { /* VM_BESTFIT */
1200 1.2 yamt for (list = first; list < end; list++) {
1201 1.2 yamt LIST_FOREACH(bt, list, bt_freelist) {
1202 1.2 yamt if (bt->bt_size >= size) {
1203 1.10 yamt start = vmem_fit(bt, size, align, phase,
1204 1.10 yamt nocross, minaddr, maxaddr);
1205 1.10 yamt if (start != VMEM_ADDR_NULL) {
1206 1.10 yamt goto gotit;
1207 1.10 yamt }
1208 1.2 yamt }
1209 1.1 yamt }
1210 1.1 yamt }
1211 1.1 yamt }
1212 1.2 yamt VMEM_UNLOCK(vm);
1213 1.1 yamt #if 1
1214 1.2 yamt if (strat == VM_INSTANTFIT) {
1215 1.2 yamt strat = VM_BESTFIT;
1216 1.2 yamt goto retry_strat;
1217 1.2 yamt }
1218 1.1 yamt #endif
1219 1.10 yamt if (align != vm->vm_quantum_mask + 1 || phase != 0 ||
1220 1.10 yamt nocross != 0 || minaddr != 0 || maxaddr != 0) {
1221 1.10 yamt
1222 1.10 yamt /*
1223 1.10 yamt * XXX should try to import a region large enough to
1224 1.10 yamt * satisfy restrictions?
1225 1.10 yamt */
1226 1.10 yamt
1227 1.20 yamt goto fail;
1228 1.10 yamt }
1229 1.2 yamt if (vmem_import(vm, size, flags) == 0) {
1230 1.2 yamt goto retry;
1231 1.1 yamt }
1232 1.2 yamt /* XXX */
1233 1.20 yamt fail:
1234 1.36.2.1 yamt if ((flags & VM_BTPAGE) != 0) {
1235 1.36.2.1 yamt uvm_pagefree(pg);
1236 1.36.2.1 yamt } else {
1237 1.36.2.1 yamt bt_free(vm, btnew);
1238 1.36.2.1 yamt bt_free(vm, btnew2);
1239 1.36.2.1 yamt }
1240 1.2 yamt return VMEM_ADDR_NULL;
1241 1.2 yamt
1242 1.2 yamt gotit:
1243 1.36.2.1 yamt #if defined(PMAP_GROWKERNEL)
1244 1.36.2.1 yamt if ((vm->vm_flags & VMC_KVA) != 0) {
1245 1.36.2.1 yamt uvm_growkernel(start + size);
1246 1.36.2.1 yamt }
1247 1.36.2.1 yamt #endif /* defined(PMAP_GROWKERNEL) */
1248 1.36.2.1 yamt if ((flags & VM_BTPAGE) != 0) {
1249 1.36.2.1 yamt vaddr_t va = (vaddr_t)start;
1250 1.36.2.1 yamt
1251 1.36.2.1 yamt KASSERT(bt->bt_start == start);
1252 1.36.2.1 yamt btnew = bt_alloc_bootstrap(vm);
1253 1.36.2.1 yamt btpage_init(vm, pg, va);
1254 1.36.2.1 yamt }
1255 1.1 yamt KASSERT(bt->bt_type == BT_TYPE_FREE);
1256 1.1 yamt KASSERT(bt->bt_size >= size);
1257 1.1 yamt bt_remfree(vm, bt);
1258 1.10 yamt if (bt->bt_start != start) {
1259 1.10 yamt btnew2->bt_type = BT_TYPE_FREE;
1260 1.10 yamt btnew2->bt_start = bt->bt_start;
1261 1.10 yamt btnew2->bt_size = start - bt->bt_start;
1262 1.10 yamt bt->bt_start = start;
1263 1.10 yamt bt->bt_size -= btnew2->bt_size;
1264 1.10 yamt bt_insfree(vm, btnew2);
1265 1.10 yamt bt_insseg(vm, btnew2, CIRCLEQ_PREV(bt, bt_seglist));
1266 1.10 yamt btnew2 = NULL;
1267 1.10 yamt }
1268 1.10 yamt KASSERT(bt->bt_start == start);
1269 1.1 yamt if (bt->bt_size != size && bt->bt_size - size > vm->vm_quantum_mask) {
1270 1.1 yamt /* split */
1271 1.1 yamt btnew->bt_type = BT_TYPE_BUSY;
1272 1.1 yamt btnew->bt_start = bt->bt_start;
1273 1.1 yamt btnew->bt_size = size;
1274 1.1 yamt bt->bt_start = bt->bt_start + size;
1275 1.1 yamt bt->bt_size -= size;
1276 1.1 yamt bt_insfree(vm, bt);
1277 1.1 yamt bt_insseg(vm, btnew, CIRCLEQ_PREV(bt, bt_seglist));
1278 1.1 yamt bt_insbusy(vm, btnew);
1279 1.1 yamt VMEM_UNLOCK(vm);
1280 1.1 yamt } else {
1281 1.1 yamt bt->bt_type = BT_TYPE_BUSY;
1282 1.1 yamt bt_insbusy(vm, bt);
1283 1.1 yamt VMEM_UNLOCK(vm);
1284 1.1 yamt bt_free(vm, btnew);
1285 1.1 yamt btnew = bt;
1286 1.1 yamt }
1287 1.10 yamt if (btnew2 != NULL) {
1288 1.10 yamt bt_free(vm, btnew2);
1289 1.10 yamt }
1290 1.1 yamt KASSERT(btnew->bt_size >= size);
1291 1.1 yamt btnew->bt_type = BT_TYPE_BUSY;
1292 1.1 yamt
1293 1.1 yamt return btnew->bt_start;
1294 1.1 yamt }
1295 1.1 yamt
1296 1.1 yamt /*
1297 1.1 yamt * vmem_free:
1298 1.1 yamt *
1299 1.1 yamt * => caller must ensure appropriate spl,
1300 1.1 yamt * if the arena can be accessed from interrupt context.
1301 1.1 yamt */
1302 1.1 yamt
1303 1.1 yamt void
1304 1.1 yamt vmem_free(vmem_t *vm, vmem_addr_t addr, vmem_size_t size)
1305 1.1 yamt {
1306 1.1 yamt
1307 1.1 yamt KASSERT(addr != VMEM_ADDR_NULL);
1308 1.1 yamt KASSERT(size > 0);
1309 1.1 yamt
1310 1.5 yamt #if defined(QCACHE)
1311 1.5 yamt if (size <= vm->vm_qcache_max) {
1312 1.5 yamt int qidx = (size + vm->vm_quantum_mask) >> vm->vm_quantum_shift;
1313 1.22 yamt qcache_t *qc = vm->vm_qcache[qidx - 1];
1314 1.5 yamt
1315 1.35 ad return pool_cache_put(qc->qc_cache, (void *)addr);
1316 1.5 yamt }
1317 1.5 yamt #endif /* defined(QCACHE) */
1318 1.5 yamt
1319 1.10 yamt vmem_xfree(vm, addr, size);
1320 1.10 yamt }
1321 1.10 yamt
1322 1.10 yamt void
1323 1.17 yamt vmem_xfree(vmem_t *vm, vmem_addr_t addr, vmem_size_t size)
1324 1.10 yamt {
1325 1.10 yamt bt_t *bt;
1326 1.10 yamt bt_t *t;
1327 1.36.2.1 yamt SLIST_HEAD(, vmem_btag) tofree;
1328 1.10 yamt
1329 1.10 yamt KASSERT(addr != VMEM_ADDR_NULL);
1330 1.10 yamt KASSERT(size > 0);
1331 1.10 yamt
1332 1.36.2.1 yamt SLIST_INIT(&tofree);
1333 1.36.2.1 yamt
1334 1.1 yamt VMEM_LOCK(vm);
1335 1.1 yamt
1336 1.1 yamt bt = bt_lookupbusy(vm, addr);
1337 1.1 yamt KASSERT(bt != NULL);
1338 1.1 yamt KASSERT(bt->bt_start == addr);
1339 1.1 yamt KASSERT(bt->bt_size == vmem_roundup_size(vm, size) ||
1340 1.1 yamt bt->bt_size - vmem_roundup_size(vm, size) <= vm->vm_quantum_mask);
1341 1.1 yamt KASSERT(bt->bt_type == BT_TYPE_BUSY);
1342 1.1 yamt bt_rembusy(vm, bt);
1343 1.1 yamt bt->bt_type = BT_TYPE_FREE;
1344 1.1 yamt
1345 1.1 yamt /* coalesce */
1346 1.1 yamt t = CIRCLEQ_NEXT(bt, bt_seglist);
1347 1.1 yamt if (t != NULL && t->bt_type == BT_TYPE_FREE) {
1348 1.1 yamt KASSERT(BT_END(bt) == t->bt_start);
1349 1.1 yamt bt_remfree(vm, t);
1350 1.1 yamt bt_remseg(vm, t);
1351 1.1 yamt bt->bt_size += t->bt_size;
1352 1.36.2.1 yamt SLIST_INSERT_HEAD(&tofree, t, bt_tmplist);
1353 1.1 yamt }
1354 1.1 yamt t = CIRCLEQ_PREV(bt, bt_seglist);
1355 1.1 yamt if (t != NULL && t->bt_type == BT_TYPE_FREE) {
1356 1.1 yamt KASSERT(BT_END(t) == bt->bt_start);
1357 1.1 yamt bt_remfree(vm, t);
1358 1.1 yamt bt_remseg(vm, t);
1359 1.1 yamt bt->bt_size += t->bt_size;
1360 1.1 yamt bt->bt_start = t->bt_start;
1361 1.36.2.1 yamt SLIST_INSERT_HEAD(&tofree, t, bt_tmplist);
1362 1.1 yamt }
1363 1.1 yamt
1364 1.1 yamt t = CIRCLEQ_PREV(bt, bt_seglist);
1365 1.1 yamt KASSERT(t != NULL);
1366 1.1 yamt KASSERT(BT_ISSPAN_P(t) || t->bt_type == BT_TYPE_BUSY);
1367 1.1 yamt if (vm->vm_freefn != NULL && t->bt_type == BT_TYPE_SPAN &&
1368 1.1 yamt t->bt_size == bt->bt_size) {
1369 1.1 yamt vmem_addr_t spanaddr;
1370 1.1 yamt vmem_size_t spansize;
1371 1.1 yamt
1372 1.1 yamt KASSERT(t->bt_start == bt->bt_start);
1373 1.1 yamt spanaddr = bt->bt_start;
1374 1.1 yamt spansize = bt->bt_size;
1375 1.1 yamt bt_remseg(vm, bt);
1376 1.36.2.1 yamt SLIST_INSERT_HEAD(&tofree, bt, bt_tmplist);
1377 1.1 yamt bt_remseg(vm, t);
1378 1.36.2.1 yamt SLIST_INSERT_HEAD(&tofree, t, bt_tmplist);
1379 1.1 yamt VMEM_UNLOCK(vm);
1380 1.1 yamt (*vm->vm_freefn)(vm->vm_source, spanaddr, spansize);
1381 1.1 yamt } else {
1382 1.1 yamt bt_insfree(vm, bt);
1383 1.1 yamt VMEM_UNLOCK(vm);
1384 1.1 yamt }
1385 1.36.2.1 yamt while ((t = SLIST_FIRST(&tofree)) != NULL) {
1386 1.36.2.1 yamt SLIST_REMOVE_HEAD(&tofree, bt_tmplist);
1387 1.36.2.1 yamt bt_free(vm, t);
1388 1.36.2.1 yamt }
1389 1.1 yamt }
1390 1.1 yamt
1391 1.1 yamt /*
1392 1.1 yamt * vmem_add:
1393 1.1 yamt *
1394 1.1 yamt * => caller must ensure appropriate spl,
1395 1.1 yamt * if the arena can be accessed from interrupt context.
1396 1.1 yamt */
1397 1.1 yamt
1398 1.1 yamt vmem_addr_t
1399 1.1 yamt vmem_add(vmem_t *vm, vmem_addr_t addr, vmem_size_t size, vm_flag_t flags)
1400 1.1 yamt {
1401 1.1 yamt
1402 1.1 yamt return vmem_add1(vm, addr, size, flags, BT_TYPE_SPAN_STATIC);
1403 1.1 yamt }
1404 1.1 yamt
1405 1.6 yamt /*
1406 1.6 yamt * vmem_reap: reap unused resources.
1407 1.6 yamt *
1408 1.26 thorpej * => return true if we successfully reaped something.
1409 1.6 yamt */
1410 1.6 yamt
1411 1.25 thorpej bool
1412 1.6 yamt vmem_reap(vmem_t *vm)
1413 1.6 yamt {
1414 1.26 thorpej bool didsomething = false;
1415 1.6 yamt
1416 1.6 yamt #if defined(QCACHE)
1417 1.6 yamt didsomething = qc_reap(vm);
1418 1.6 yamt #endif /* defined(QCACHE) */
1419 1.6 yamt return didsomething;
1420 1.6 yamt }
1421 1.6 yamt
1422 1.30 yamt /* ---- rehash */
1423 1.30 yamt
1424 1.30 yamt #if defined(_KERNEL)
1425 1.30 yamt static struct callout vmem_rehash_ch;
1426 1.30 yamt static int vmem_rehash_interval;
1427 1.30 yamt static struct workqueue *vmem_rehash_wq;
1428 1.30 yamt static struct work vmem_rehash_wk;
1429 1.30 yamt
1430 1.30 yamt static void
1431 1.30 yamt vmem_rehash_all(struct work *wk, void *dummy)
1432 1.30 yamt {
1433 1.30 yamt vmem_t *vm;
1434 1.30 yamt
1435 1.30 yamt KASSERT(wk == &vmem_rehash_wk);
1436 1.30 yamt mutex_enter(&vmem_list_lock);
1437 1.30 yamt LIST_FOREACH(vm, &vmem_list, vm_alllist) {
1438 1.30 yamt size_t desired;
1439 1.30 yamt size_t current;
1440 1.30 yamt
1441 1.30 yamt if (!VMEM_TRYLOCK(vm)) {
1442 1.30 yamt continue;
1443 1.30 yamt }
1444 1.30 yamt desired = vm->vm_nbusytag;
1445 1.30 yamt current = vm->vm_hashsize;
1446 1.30 yamt VMEM_UNLOCK(vm);
1447 1.30 yamt
1448 1.30 yamt if (desired > VMEM_HASHSIZE_MAX) {
1449 1.30 yamt desired = VMEM_HASHSIZE_MAX;
1450 1.30 yamt } else if (desired < VMEM_HASHSIZE_MIN) {
1451 1.30 yamt desired = VMEM_HASHSIZE_MIN;
1452 1.30 yamt }
1453 1.30 yamt if (desired > current * 2 || desired * 2 < current) {
1454 1.30 yamt vmem_rehash(vm, desired, VM_NOSLEEP);
1455 1.30 yamt }
1456 1.30 yamt }
1457 1.30 yamt mutex_exit(&vmem_list_lock);
1458 1.30 yamt
1459 1.30 yamt callout_schedule(&vmem_rehash_ch, vmem_rehash_interval);
1460 1.30 yamt }
1461 1.30 yamt
1462 1.30 yamt static void
1463 1.30 yamt vmem_rehash_all_kick(void *dummy)
1464 1.30 yamt {
1465 1.30 yamt
1466 1.32 rmind workqueue_enqueue(vmem_rehash_wq, &vmem_rehash_wk, NULL);
1467 1.30 yamt }
1468 1.30 yamt
1469 1.30 yamt void
1470 1.30 yamt vmem_rehash_start(void)
1471 1.30 yamt {
1472 1.30 yamt int error;
1473 1.30 yamt
1474 1.30 yamt error = workqueue_create(&vmem_rehash_wq, "vmem_rehash",
1475 1.34 ad vmem_rehash_all, NULL, PRI_VM, IPL_SOFTCLOCK, 0);
1476 1.30 yamt if (error) {
1477 1.30 yamt panic("%s: workqueue_create %d\n", __func__, error);
1478 1.30 yamt }
1479 1.31 ad callout_init(&vmem_rehash_ch, 0);
1480 1.30 yamt callout_setfunc(&vmem_rehash_ch, vmem_rehash_all_kick, NULL);
1481 1.30 yamt
1482 1.30 yamt vmem_rehash_interval = hz * 10;
1483 1.30 yamt callout_schedule(&vmem_rehash_ch, vmem_rehash_interval);
1484 1.30 yamt }
1485 1.30 yamt #endif /* defined(_KERNEL) */
1486 1.30 yamt
1487 1.1 yamt /* ---- debug */
1488 1.1 yamt
1489 1.1 yamt #if defined(VMEM_DEBUG)
1490 1.1 yamt
1491 1.1 yamt #if !defined(_KERNEL)
1492 1.1 yamt #include <stdio.h>
1493 1.1 yamt #endif /* !defined(_KERNEL) */
1494 1.1 yamt
1495 1.1 yamt void bt_dump(const bt_t *);
1496 1.1 yamt
1497 1.1 yamt void
1498 1.1 yamt bt_dump(const bt_t *bt)
1499 1.1 yamt {
1500 1.1 yamt
1501 1.36.2.1 yamt printf("\t%p: %" PRIu64 "(0x%" PRIx64 "), %" PRIu64 "(0x%" PRIx64
1502 1.36.2.1 yamt "), %d\n",
1503 1.36.2.1 yamt bt,
1504 1.36.2.1 yamt (uint64_t)bt->bt_start, (uint64_t)bt->bt_start,
1505 1.36.2.1 yamt (uint64_t)bt->bt_size, (uint64_t)bt->bt_size,
1506 1.1 yamt bt->bt_type);
1507 1.1 yamt }
1508 1.1 yamt
1509 1.1 yamt void
1510 1.36.2.1 yamt vmem_dump_seglist(const vmem_t *vm)
1511 1.1 yamt {
1512 1.1 yamt const bt_t *bt;
1513 1.1 yamt
1514 1.36.2.1 yamt printf("vmem %p '%s' SEGLIST\n", vm, vm->vm_name);
1515 1.36.2.1 yamt
1516 1.1 yamt CIRCLEQ_FOREACH(bt, &vm->vm_seglist, bt_seglist) {
1517 1.1 yamt bt_dump(bt);
1518 1.1 yamt }
1519 1.36.2.1 yamt }
1520 1.36.2.1 yamt
1521 1.36.2.1 yamt void
1522 1.36.2.1 yamt vmem_dump_freelist(const vmem_t *vm)
1523 1.36.2.1 yamt {
1524 1.36.2.1 yamt const bt_t *bt;
1525 1.36.2.1 yamt int i;
1526 1.36.2.1 yamt
1527 1.36.2.1 yamt printf("vmem %p '%s' FREELIST\n", vm, vm->vm_name);
1528 1.1 yamt
1529 1.1 yamt for (i = 0; i < VMEM_MAXORDER; i++) {
1530 1.1 yamt const struct vmem_freelist *fl = &vm->vm_freelist[i];
1531 1.1 yamt
1532 1.1 yamt if (LIST_EMPTY(fl)) {
1533 1.1 yamt continue;
1534 1.1 yamt }
1535 1.1 yamt
1536 1.1 yamt printf("freelist[%d]\n", i);
1537 1.1 yamt LIST_FOREACH(bt, fl, bt_freelist) {
1538 1.1 yamt bt_dump(bt);
1539 1.1 yamt }
1540 1.1 yamt }
1541 1.1 yamt }
1542 1.1 yamt
1543 1.36.2.1 yamt #if defined(QCACHE)
1544 1.36.2.1 yamt void
1545 1.36.2.1 yamt vmem_dump_qc(const vmem_t *vm)
1546 1.36.2.1 yamt {
1547 1.36.2.1 yamt int qcache_idx_max = vm->vm_qcache_max >> vm->vm_quantum_shift;
1548 1.36.2.1 yamt int i;
1549 1.36.2.1 yamt const qcache_t *prevqc;
1550 1.36.2.1 yamt
1551 1.36.2.1 yamt printf("qcache_max=%zu\n", vm->vm_qcache_max);
1552 1.36.2.1 yamt
1553 1.36.2.1 yamt prevqc = NULL;
1554 1.36.2.1 yamt for (i = 0; i < qcache_idx_max; i++) {
1555 1.36.2.1 yamt const qcache_t *qc;
1556 1.36.2.1 yamt
1557 1.36.2.1 yamt qc = vm->vm_qcache[i];
1558 1.36.2.1 yamt if (prevqc != qc) {
1559 1.36.2.1 yamt printf("CACHE[%d] (%zu-) %p\n",
1560 1.36.2.1 yamt i, (size_t)i << vm->vm_quantum_shift, qc->qc_cache);
1561 1.36.2.1 yamt }
1562 1.36.2.1 yamt prevqc = qc;
1563 1.36.2.1 yamt }
1564 1.36.2.1 yamt }
1565 1.36.2.1 yamt #endif /* defined(QCACHE) */
1566 1.36.2.1 yamt
1567 1.36.2.1 yamt void
1568 1.36.2.1 yamt vmem_dump(const vmem_t *vm)
1569 1.36.2.1 yamt {
1570 1.36.2.1 yamt
1571 1.36.2.1 yamt printf("vmem %p '%s'\n", vm, vm->vm_name);
1572 1.36.2.1 yamt vmem_dump_seglist(vm);
1573 1.36.2.1 yamt vmem_dump_freelist(vm);
1574 1.36.2.1 yamt #if defined(QCACHE)
1575 1.36.2.1 yamt vmem_dump_qc(vm);
1576 1.36.2.1 yamt #endif /* defined(QCACHE) */
1577 1.36.2.1 yamt }
1578 1.36.2.1 yamt
1579 1.1 yamt #if !defined(_KERNEL)
1580 1.1 yamt
1581 1.1 yamt int
1582 1.1 yamt main()
1583 1.1 yamt {
1584 1.1 yamt vmem_t *vm;
1585 1.1 yamt vmem_addr_t p;
1586 1.1 yamt struct reg {
1587 1.1 yamt vmem_addr_t p;
1588 1.1 yamt vmem_size_t sz;
1589 1.25 thorpej bool x;
1590 1.1 yamt } *reg = NULL;
1591 1.1 yamt int nreg = 0;
1592 1.1 yamt int nalloc = 0;
1593 1.1 yamt int nfree = 0;
1594 1.1 yamt vmem_size_t total = 0;
1595 1.1 yamt #if 1
1596 1.1 yamt vm_flag_t strat = VM_INSTANTFIT;
1597 1.1 yamt #else
1598 1.1 yamt vm_flag_t strat = VM_BESTFIT;
1599 1.1 yamt #endif
1600 1.1 yamt
1601 1.1 yamt vm = vmem_create("test", VMEM_ADDR_NULL, 0, 1,
1602 1.30 yamt NULL, NULL, NULL, 0, VM_SLEEP);
1603 1.1 yamt if (vm == NULL) {
1604 1.1 yamt printf("vmem_create\n");
1605 1.1 yamt exit(EXIT_FAILURE);
1606 1.1 yamt }
1607 1.1 yamt vmem_dump(vm);
1608 1.1 yamt
1609 1.1 yamt p = vmem_add(vm, 100, 200, VM_SLEEP);
1610 1.1 yamt p = vmem_add(vm, 2000, 1, VM_SLEEP);
1611 1.1 yamt p = vmem_add(vm, 40000, 0x10000000>>12, VM_SLEEP);
1612 1.1 yamt p = vmem_add(vm, 10000, 10000, VM_SLEEP);
1613 1.1 yamt p = vmem_add(vm, 500, 1000, VM_SLEEP);
1614 1.1 yamt vmem_dump(vm);
1615 1.1 yamt for (;;) {
1616 1.1 yamt struct reg *r;
1617 1.10 yamt int t = rand() % 100;
1618 1.1 yamt
1619 1.10 yamt if (t > 45) {
1620 1.10 yamt /* alloc */
1621 1.1 yamt vmem_size_t sz = rand() % 500 + 1;
1622 1.25 thorpej bool x;
1623 1.10 yamt vmem_size_t align, phase, nocross;
1624 1.10 yamt vmem_addr_t minaddr, maxaddr;
1625 1.10 yamt
1626 1.10 yamt if (t > 70) {
1627 1.26 thorpej x = true;
1628 1.10 yamt /* XXX */
1629 1.10 yamt align = 1 << (rand() % 15);
1630 1.10 yamt phase = rand() % 65536;
1631 1.10 yamt nocross = 1 << (rand() % 15);
1632 1.10 yamt if (align <= phase) {
1633 1.10 yamt phase = 0;
1634 1.10 yamt }
1635 1.19 yamt if (VMEM_CROSS_P(phase, phase + sz - 1,
1636 1.19 yamt nocross)) {
1637 1.10 yamt nocross = 0;
1638 1.10 yamt }
1639 1.10 yamt minaddr = rand() % 50000;
1640 1.10 yamt maxaddr = rand() % 70000;
1641 1.10 yamt if (minaddr > maxaddr) {
1642 1.10 yamt minaddr = 0;
1643 1.10 yamt maxaddr = 0;
1644 1.10 yamt }
1645 1.10 yamt printf("=== xalloc %" PRIu64
1646 1.10 yamt " align=%" PRIu64 ", phase=%" PRIu64
1647 1.10 yamt ", nocross=%" PRIu64 ", min=%" PRIu64
1648 1.10 yamt ", max=%" PRIu64 "\n",
1649 1.10 yamt (uint64_t)sz,
1650 1.10 yamt (uint64_t)align,
1651 1.10 yamt (uint64_t)phase,
1652 1.10 yamt (uint64_t)nocross,
1653 1.10 yamt (uint64_t)minaddr,
1654 1.10 yamt (uint64_t)maxaddr);
1655 1.10 yamt p = vmem_xalloc(vm, sz, align, phase, nocross,
1656 1.10 yamt minaddr, maxaddr, strat|VM_SLEEP);
1657 1.10 yamt } else {
1658 1.26 thorpej x = false;
1659 1.10 yamt printf("=== alloc %" PRIu64 "\n", (uint64_t)sz);
1660 1.10 yamt p = vmem_alloc(vm, sz, strat|VM_SLEEP);
1661 1.10 yamt }
1662 1.1 yamt printf("-> %" PRIu64 "\n", (uint64_t)p);
1663 1.1 yamt vmem_dump(vm);
1664 1.1 yamt if (p == VMEM_ADDR_NULL) {
1665 1.10 yamt if (x) {
1666 1.10 yamt continue;
1667 1.10 yamt }
1668 1.1 yamt break;
1669 1.1 yamt }
1670 1.1 yamt nreg++;
1671 1.1 yamt reg = realloc(reg, sizeof(*reg) * nreg);
1672 1.1 yamt r = ®[nreg - 1];
1673 1.1 yamt r->p = p;
1674 1.1 yamt r->sz = sz;
1675 1.10 yamt r->x = x;
1676 1.1 yamt total += sz;
1677 1.1 yamt nalloc++;
1678 1.1 yamt } else if (nreg != 0) {
1679 1.10 yamt /* free */
1680 1.1 yamt r = ®[rand() % nreg];
1681 1.1 yamt printf("=== free %" PRIu64 ", %" PRIu64 "\n",
1682 1.1 yamt (uint64_t)r->p, (uint64_t)r->sz);
1683 1.10 yamt if (r->x) {
1684 1.10 yamt vmem_xfree(vm, r->p, r->sz);
1685 1.10 yamt } else {
1686 1.10 yamt vmem_free(vm, r->p, r->sz);
1687 1.10 yamt }
1688 1.1 yamt total -= r->sz;
1689 1.1 yamt vmem_dump(vm);
1690 1.1 yamt *r = reg[nreg - 1];
1691 1.1 yamt nreg--;
1692 1.1 yamt nfree++;
1693 1.1 yamt }
1694 1.1 yamt printf("total=%" PRIu64 "\n", (uint64_t)total);
1695 1.1 yamt }
1696 1.1 yamt fprintf(stderr, "total=%" PRIu64 ", nalloc=%d, nfree=%d\n",
1697 1.1 yamt (uint64_t)total, nalloc, nfree);
1698 1.1 yamt exit(EXIT_SUCCESS);
1699 1.1 yamt }
1700 1.1 yamt #endif /* !defined(_KERNEL) */
1701 1.1 yamt #endif /* defined(VMEM_DEBUG) */
1702