/*	$Id: uvm_km.c,v 1.1 1998/02/05 06:25:10 mrg Exp $	*/

/*
 * XXXCDC: "ROUGH DRAFT" QUALITY UVM PRE-RELEASE FILE!
 *         >>>USE AT YOUR OWN RISK, WORK IS NOT FINISHED<<<
 */
/*
 * Copyright (c) 1997 Charles D. Cranor and Washington University.
 * Copyright (c) 1991, 1993, The Regents of the University of California.
 *
 * All rights reserved.
 *
 * This code is derived from software contributed to Berkeley by
 * The Mach Operating System project at Carnegie-Mellon University.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. All advertising materials mentioning features or use of this software
 *    must display the following acknowledgement:
 *      This product includes software developed by Charles D. Cranor,
 *      Washington University, the University of California, Berkeley and
 *      its contributors.
 * 4. Neither the name of the University nor the names of its contributors
 *    may be used to endorse or promote products derived from this software
 *    without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 *
 *	@(#)vm_kern.c   8.3 (Berkeley) 1/12/94
 *
 *
 * Copyright (c) 1987, 1990 Carnegie-Mellon University.
 * All rights reserved.
 *
 * Permission to use, copy, modify and distribute this software and
 * its documentation is hereby granted, provided that both the copyright
 * notice and this permission notice appear in all copies of the
 * software, derivative works or modified versions, and any portions
 * thereof, and that both notices appear in supporting documentation.
 *
 * CARNEGIE MELLON ALLOWS FREE USE OF THIS SOFTWARE IN ITS "AS IS"
 * CONDITION.  CARNEGIE MELLON DISCLAIMS ANY LIABILITY OF ANY KIND
 * FOR ANY DAMAGES WHATSOEVER RESULTING FROM THE USE OF THIS SOFTWARE.
 *
 * Carnegie Mellon requests users of this software to return to
 *
 *  Software Distribution Coordinator  or  Software.Distribution@CS.CMU.EDU
 *  School of Computer Science
 *  Carnegie Mellon University
 *  Pittsburgh PA 15213-3890
 *
 * any improvements or extensions that they make and grant Carnegie the
 * rights to redistribute these changes.
 */

/*
 * uvm_km.c: handle kernel memory allocation and management
 */

#include <sys/param.h>
#include <sys/systm.h>
#include <sys/proc.h>

#include <vm/vm.h>
#include <vm/vm_page.h>
#include <vm/vm_kern.h>

#include <uvm/uvm.h>

/*
 * global data structures
 */

vm_map_t kernel_map = NULL;

/*
 * local functions
 */

static int uvm_km_get __P((struct uvm_object *, vm_offset_t,
    vm_page_t *, int *, int, vm_prot_t, int, int));

/*
 * local data structures
 */

static struct vm_map kernel_map_store;
static struct uvm_object kernel_object_store;
static struct uvm_object kmem_object_store;
static struct uvm_object mb_object_store;

static struct uvm_pagerops km_pager = {
    NULL,       /* init */
    NULL,       /* attach */
    NULL,       /* reference */
    NULL,       /* detach */
    NULL,       /* fault */
    NULL,       /* flush */
    uvm_km_get, /* get */
    /* ... rest are NULL */
};

/*
 * uvm_km_get: pager get function for kernel objects
 *
 * => currently we do not support pageout to the swap area, so this
 *    pager is very simple.  eventually we may want an anonymous
 *    object pager which will do paging.
 */

static int uvm_km_get(uobj, offset, pps, npagesp, centeridx, access_type,
    advice, flags)
    struct uvm_object *uobj;
    vm_offset_t offset;
    struct vm_page **pps;
    int *npagesp;
    int centeridx, advice, flags;
    vm_prot_t access_type;
{
    vm_offset_t current_offset;
    vm_page_t ptmp;
    int lcv, gotpages, maxpages;
    boolean_t done;
    UVMHIST_FUNC("uvm_km_get"); UVMHIST_CALLED(maphist);

    UVMHIST_LOG(maphist, "flags=%d", flags,0,0,0);

    /*
     * get number of pages
     */

    maxpages = *npagesp;

    /*
     * step 1: handle the case where the fault data structures are locked.
     */

    if (flags & PGO_LOCKED) {

        /*
         * step 1a: get pages that are already resident.  only do this
         * if the data structures are locked (i.e. the first time through).
         */

        done = TRUE;    /* be optimistic */
        gotpages = 0;   /* # of pages we got so far */

        for (lcv = 0, current_offset = offset ;
            lcv < maxpages ; lcv++, current_offset += PAGE_SIZE) {

            /* do we care about this page?  if not, skip it */
            if (pps[lcv] == PGO_DONTCARE)
                continue;

            /* lookup page */
            ptmp = uvm_pagelookup(uobj, current_offset);

            /* null?  attempt to allocate the page */
            if (ptmp == NULL) {
                ptmp = uvm_pagealloc(uobj, current_offset, NULL);
                if (ptmp) {
                    ptmp->flags &= ~(PG_BUSY|PG_FAKE);  /* new page */
                    UVM_PAGE_OWN(ptmp, NULL);
                    ptmp->wire_count = 1;  /* XXX: prevents pageout attempts */
                    uvm_pagezero(ptmp);
                }
            }

            /* to be useful must get a non-busy, non-released page */
            if (ptmp == NULL || (ptmp->flags & (PG_BUSY|PG_RELEASED)) != 0) {
                if (lcv == centeridx || (flags & PGO_ALLPAGES) != 0)
                    done = FALSE;   /* need to do a wait or I/O! */
                continue;
            }

            /* useful page: busy/lock it and plug it in our result array */
            ptmp->flags |= PG_BUSY;     /* caller must un-busy this page */
            UVM_PAGE_OWN(ptmp, "uvm_km_get1");
            pps[lcv] = ptmp;
            gotpages++;

        }   /* "for" lcv loop */

        /*
         * step 1b: now we've either done everything needed or we need to
         * unlock and do some waiting or I/O.
         */

        UVMHIST_LOG(maphist, "<- done (done=%d)", done, 0,0,0);

        *npagesp = gotpages;
        if (done)
            return(VM_PAGER_OK);        /* bingo! */
        else
            return(VM_PAGER_UNLOCK);    /* EEK!  Need to unlock and I/O */
    }

    /*
     * step 2: get non-resident or busy pages.
     * object is locked.  data structures are unlocked.
     */

    for (lcv = 0, current_offset = offset ;
        lcv < maxpages ; lcv++, current_offset += PAGE_SIZE) {

        /* skip over pages we've already gotten or don't want */
        /* skip over pages we don't _have_ to get */
        if (pps[lcv] != NULL ||
            (lcv != centeridx && (flags & PGO_ALLPAGES) == 0))
            continue;

        /*
         * we have yet to locate the current page (pps[lcv]).  we first
         * look for a page that is already at the current offset.  if we
         * find a page, we check to see if it is busy or released.  if that
         * is the case, then we sleep on the page until it is no longer busy
         * or released and repeat the lookup.  if the page we found is
         * neither busy nor released, then we busy it (so we own it) and
         * plug it into pps[lcv].  this 'break's the following while loop
         * and indicates we are ready to move on to the next page in the
         * "lcv" loop above.
         *
         * if we exit the while loop with pps[lcv] still set to NULL, then
         * it means that we allocated a new busy/fake/clean page ptmp in the
         * object and we need to do I/O to fill in the data.
         */

        while (pps[lcv] == NULL) {  /* top of "pps" while loop */

            /* look for a current page */
            ptmp = uvm_pagelookup(uobj, current_offset);

            /* nope?  allocate one now (if we can) */
            if (ptmp == NULL) {

                ptmp = uvm_pagealloc(uobj, current_offset, NULL);  /* alloc */

                /* out of RAM? */
                if (ptmp == NULL) {
                    simple_unlock(&uobj->vmobjlock);
                    uvm_wait("kmgetwait1");
                    simple_lock(&uobj->vmobjlock);
                    continue;   /* goto top of pps while loop */
                }

                /*
                 * got new page ready for I/O.  break pps while loop.
                 * pps[lcv] is still NULL.
                 */
                break;
            }

            /* page is there, see if we need to wait on it */
            if ((ptmp->flags & (PG_BUSY|PG_RELEASED)) != 0) {
                ptmp->flags |= PG_WANTED;
                UVM_UNLOCK_AND_WAIT(ptmp, &uobj->vmobjlock, 0, "uvn_get", 0);
                simple_lock(&uobj->vmobjlock);
                continue;   /* goto top of pps while loop */
            }

            /*
             * if we get here then the page has become resident and unbusy
             * between steps 1 and 2.  we busy it now (so we own it) and set
             * pps[lcv] (so that we exit the while loop).
             */
            ptmp->flags |= PG_BUSY;     /* we own it, caller must un-busy */
            UVM_PAGE_OWN(ptmp, "uvm_km_get2");
            pps[lcv] = ptmp;
        }

        /*
         * if we own a valid page at the correct offset, pps[lcv] will
         * point to it.  nothing more to do except go to the next page.
         */

        if (pps[lcv])
            continue;   /* next lcv */

        /*
         * we have a "fake/busy/clean" page that we just allocated.
         * do the needed "i/o" (in this case that means zero it).
         */

        uvm_pagezero(ptmp);
        ptmp->flags &= ~(PG_FAKE);
        ptmp->wire_count = 1;   /* XXX: prevents pageout attempts */
        pps[lcv] = ptmp;

    }   /* lcv loop */

    /*
     * finally, unlock object and return.
     */

    simple_unlock(&uobj->vmobjlock);
    UVMHIST_LOG(maphist, "<- done (OK)",0,0,0,0);
    return(VM_PAGER_OK);
}
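
/*
 * Usage note (an illustrative sketch, not part of the original file):
 * callers normally reach the function above through the pgops vector of a
 * kernel object rather than calling it directly; "pgo_get" is the get
 * member of uvm_pagerops, and "uobj", "offset", and "result" below are
 * hypothetical locals.
 *
 *     struct vm_page *pps[1];
 *     int npages = 1, result;
 *
 *     pps[0] = NULL;
 *     result = uobj->pgops->pgo_get(uobj, offset, pps, &npages, 0,
 *         VM_PROT_READ, UVM_ADV_RANDOM, PGO_LOCKED);
 *     if (result == VM_PAGER_UNLOCK)
 *         ... unlock the fault data structures and retry the get
 *             without PGO_LOCKED so waiting/"I/O" can happen ...
 */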

/*
 * uvm_km_init: init kernel maps and objects to reflect reality (i.e.
 * KVM already allocated for text, data, bss, and static data structures).
 *
 * => KVM is defined by VM_MIN_KERNEL_ADDRESS/VM_MAX_KERNEL_ADDRESS.
 *    we assume that [min -> start] has already been allocated and that
 *    "end" is the end.
 */

void uvm_km_init(start, end)
    vm_offset_t start, end;
{
    vm_offset_t base = VM_MIN_KERNEL_ADDRESS;

    /*
     * first, init kernel memory objects.
     */

    /* kernel_object: for pageable anonymous kernel memory (eventually) */
    simple_lock_init(&kernel_object_store.vmobjlock);
    kernel_object_store.pgops = &km_pager;
    TAILQ_INIT(&kernel_object_store.memq);
    kernel_object_store.uo_npages = 0;
    kernel_object_store.uo_refs = UVM_OBJ_KERN;
                            /* we are special.  we never die */
    uvm.kernel_object = &kernel_object_store;

    /* kmem_object: for malloc'd memory (always wired) */
    simple_lock_init(&kmem_object_store.vmobjlock);
    kmem_object_store.pgops = &km_pager;
    TAILQ_INIT(&kmem_object_store.memq);
    kmem_object_store.uo_npages = 0;
    kmem_object_store.uo_refs = UVM_OBJ_KERN;
                            /* we are special.  we never die */
    uvmexp.kmem_object = &kmem_object_store;

    /* mb_object: for mbuf memory (always wired) */
    simple_lock_init(&mb_object_store.vmobjlock);
    mb_object_store.pgops = &km_pager;
    TAILQ_INIT(&mb_object_store.memq);
    mb_object_store.uo_npages = 0;
    mb_object_store.uo_refs = UVM_OBJ_KERN;
                            /* we are special.  we never die */
    uvmexp.mb_object = &mb_object_store;

    /*
     * init the map and reserve kernel space before installing.
     */

    uvm_map_setup(&kernel_map_store, base, end, FALSE);
    kernel_map_store.pmap = pmap_kernel();
    if (uvm_map(&kernel_map_store, &base, start - base, NULL,
        UVM_UNKNOWN_OFFSET, UVM_MAPFLAG(UVM_PROT_ALL, UVM_PROT_ALL,
        UVM_INH_NONE, UVM_ADV_RANDOM, UVM_FLAG_FIXED)) != KERN_SUCCESS)
        panic("uvm_km_init: could not reserve space for kernel");

    /*
     * install!
     */

    kernel_map = &kernel_map_store;
}
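
/*
 * Example (an illustrative sketch, not from the original source): a
 * machine-dependent bootstrap routine would call uvm_km_init once the
 * kernel's static allocations are known.  "kernel_virtual_start" is a
 * hypothetical name for the first free address above text/data/bss.
 *
 *     uvm_km_init(kernel_virtual_start, VM_MAX_KERNEL_ADDRESS);
 */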

/*
 * uvm_km_suballoc: allocate a submap in the kernel map.  once a submap
 * is allocated all references to that area of VM must go through it.  this
 * allows the locking of VAs in kernel_map to be broken up into regions.
 *
 * => if submap is non NULL we use that as the submap, otherwise we
 *    alloc a new map
 */

struct vm_map *uvm_km_suballoc(map, min, max, size, pageable, submap)
    struct vm_map *map;
    vm_offset_t *min, *max;     /* OUT, OUT */
    vm_size_t size;
    boolean_t pageable;
    struct vm_map *submap;
{
    size = round_page(size);    /* round up to pagesize */

    /*
     * first allocate a blank spot in the parent map
     */

    if (uvm_map(map, min, size, NULL, UVM_UNKNOWN_OFFSET,
        UVM_MAPFLAG(UVM_PROT_ALL, UVM_PROT_ALL, UVM_INH_NONE,
        UVM_ADV_RANDOM, UVM_FLAG_NOMERGE)) != KERN_SUCCESS) {
        panic("uvm_km_suballoc: unable to allocate space in parent map");
    }

    /*
     * set VM bounds (min is filled in by uvm_map)
     */

    *max = *min + size;

    /*
     * add references to pmap and create or init the submap
     */

    pmap_reference(vm_map_pmap(map));
    if (submap == NULL) {
        submap = uvm_map_create(vm_map_pmap(map), *min, *max, pageable);
        if (submap == NULL)
            panic("uvm_km_suballoc: unable to create submap");
    } else {
        uvm_map_setup(submap, *min, *max, pageable);
        submap->pmap = vm_map_pmap(map);
    }

    /*
     * now let uvm_map_submap plug it in...
     */

    if (uvm_map_submap(map, *min, *max, submap) != KERN_SUCCESS)
        panic("uvm_km_suballoc: submap allocation failed");

    return(submap);
}
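
/*
 * Example (an illustrative sketch, not from the original source): boot
 * code typically carves wired submaps such as a kmem_map out of
 * kernel_map.  The size is arbitrary here; "minaddr"/"maxaddr" are
 * hypothetical locals.
 *
 *     vm_offset_t minaddr, maxaddr;
 *     struct vm_map *kmem_map;
 *
 *     kmem_map = uvm_km_suballoc(kernel_map, &minaddr, &maxaddr,
 *         (vm_size_t)(512 * PAGE_SIZE), FALSE, NULL);
 */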

/*
 * uvm_km_pgremove: remove pages from a kernel uvm_object.
 *
 * => when you unmap a part of anonymous kernel memory you want to toss
 *    the pages right away.  (this gets called from uvm_unmap_...).
 */

#define UKM_HASH_PENALTY 4      /* a guess */

void uvm_km_pgremove(uobj, start, end)
    struct uvm_object *uobj;
    vm_offset_t start, end;
{
    boolean_t by_list;
    struct vm_page *pp, *ppnext;
    vm_offset_t curoff;
    UVMHIST_FUNC("uvm_km_pgremove"); UVMHIST_CALLED(maphist);

    simple_lock(&uobj->vmobjlock);      /* lock object */

    /* choose cheapest traversal */
    by_list = (uobj->uo_npages <=
        ((end - start) / PAGE_SIZE) * UKM_HASH_PENALTY);

    if (by_list)
        goto loop_by_list;

    /* by hash */

    for (curoff = start ; curoff < end ; curoff += PAGE_SIZE) {
        pp = uvm_pagelookup(uobj, curoff);
        if (pp == NULL)
            continue;

        UVMHIST_LOG(maphist, "  page 0x%x, busy=%d", pp,
            pp->flags & PG_BUSY, 0, 0);
        /* now do the actual work */
        if (pp->flags & PG_BUSY)
            pp->flags |= PG_RELEASED;  /* owner must check for this when done */
        else {
            pmap_page_protect(PMAP_PGARG(pp), VM_PROT_NONE);
            uvm_lock_pageq();
            uvm_pagefree(pp);
            uvm_unlock_pageq();
        }
        /* done */

    }
    simple_unlock(&uobj->vmobjlock);
    return;

loop_by_list:

    for (pp = uobj->memq.tqh_first ; pp != NULL ; pp = ppnext) {

        ppnext = pp->listq.tqe_next;
        if (pp->offset < start || pp->offset >= end) {
            continue;
        }

        UVMHIST_LOG(maphist, "  page 0x%x, busy=%d", pp,
            pp->flags & PG_BUSY, 0, 0);
        /* now do the actual work */
        if (pp->flags & PG_BUSY)
            pp->flags |= PG_RELEASED;  /* owner must check for this when done */
        else {
            pmap_page_protect(PMAP_PGARG(pp), VM_PROT_NONE);
            uvm_lock_pageq();
            uvm_pagefree(pp);
            uvm_unlock_pageq();
        }
        /* done */

    }
    simple_unlock(&uobj->vmobjlock);
    return;
}

/*
 * uvm_km_kmemalloc: lower level kernel memory allocator for malloc()
 *
 * => we map wired memory into the specified map using the obj passed in
 * => NOTE: we can return 0 even if we can wait if there is not enough
 *    free VM space in the map... caller should be prepared to handle
 *    this case.
 * => we return KVA of memory allocated
 * => flags: NOWAIT, VALLOC - just allocate VA, TRYLOCK - fail if we can't
 *    lock the map
 */

vm_offset_t uvm_km_kmemalloc(map, obj, size, flags)
    vm_map_t map;
    struct uvm_object *obj;
    vm_size_t size;
    int flags;
{
    vm_offset_t kva, loopva;
    vm_offset_t offset;
    struct vm_page *pg;
    UVMHIST_FUNC("uvm_km_kmemalloc"); UVMHIST_CALLED(maphist);

    UVMHIST_LOG(maphist, "  (map=0x%x, obj=0x%x, size=0x%x, flags=%d)",
        map, obj, size, flags);
#ifdef DIAGNOSTIC
    /* sanity check */
    if (vm_map_pmap(map) != pmap_kernel())
        panic("uvm_km_kmemalloc: invalid map");
#endif

    /*
     * setup for call
     */

    size = round_page(size);
    kva = vm_map_min(map);      /* hint */

    /*
     * allocate some virtual space
     */

    if (uvm_map(map, &kva, size, obj, UVM_UNKNOWN_OFFSET,
        UVM_MAPFLAG(UVM_PROT_ALL, UVM_PROT_ALL, UVM_INH_NONE,
        UVM_ADV_RANDOM, (flags & UVM_KMF_TRYLOCK))) != KERN_SUCCESS) {
        UVMHIST_LOG(maphist, "<- done (no VM)",0,0,0,0);
        return(0);
    }

    /*
     * if all we wanted was VA, return now
     */

    if (flags & UVM_KMF_VALLOC) {
        UVMHIST_LOG(maphist,"<- done valloc (kva=0x%x)", kva,0,0,0);
        return(kva);
    }

    /*
     * recover object offset from virtual address
     */

    offset = kva - vm_map_min(map);
    UVMHIST_LOG(maphist, "  kva=0x%x, offset=0x%x", kva, offset,0,0);

    /*
     * now allocate and map in the memory... note that we are the only ones
     * who should ever get a handle on this area of VM.
     */

    loopva = kva;
    while (size) {
        simple_lock(&obj->vmobjlock);
        pg = uvm_pagealloc(obj, offset, NULL);
        if (pg) {
            pg->flags &= ~PG_BUSY;      /* new page */
            UVM_PAGE_OWN(pg, NULL);
        }
        simple_unlock(&obj->vmobjlock);

        /*
         * out of memory?
         */

        if (pg == NULL) {
            if (flags & UVM_KMF_NOWAIT) {
                uvm_unmap(map, kva, kva + size, 0); /* free everything! */
                return(0);
            } else {
                uvm_wait("km_getwait2");    /* sleep here */
                continue;
            }
        }

        /*
         * map it in: note that we call pmap_enter with the map and object
         * unlocked in case we are kmem_map/kmem_object (because if
         * pmap_enter wants to allocate out of kmem_object it will need to
         * lock it itself!)
         */
#if defined(PMAP_NEW)
        pmap_kenter_pa(loopva, VM_PAGE_TO_PHYS(pg), VM_PROT_ALL);
#else
        pmap_enter(map->pmap, loopva, VM_PAGE_TO_PHYS(pg), UVM_PROT_ALL, TRUE);
#endif
        loopva += PAGE_SIZE;
        offset += PAGE_SIZE;
        size -= PAGE_SIZE;
    }

    UVMHIST_LOG(maphist,"<- done (kva=0x%x)", kva,0,0,0);
    return(kva);
}
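
/*
 * Example (an illustrative sketch, not from the original source): a
 * malloc()-level caller would allocate wired pages from a kmem_map
 * submap backed by the kmem_object set up in uvm_km_init above.
 * "kmem_map" and "len" are stand-ins for the caller's map and size.
 *
 *     vm_offset_t va;
 *
 *     va = uvm_km_kmemalloc(kmem_map, uvmexp.kmem_object,
 *         (vm_size_t)round_page(len), UVM_KMF_NOWAIT);
 *     if (va == 0)
 *         ... out of VA or physical memory: caller must cope ...
 */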

/*
 * uvm_km_free: free an area of kernel memory
 */

void uvm_km_free(map, addr, size)
    vm_map_t map;
    vm_offset_t addr;
    vm_size_t size;
{
    uvm_unmap(map, trunc_page(addr), round_page(addr+size), 1);
}

/*
 * uvm_km_free_wakeup: free an area of kernel memory and wake up
 * anyone waiting for vm space.
 *
 * => XXX: "wanted" bit + unlock&wait on other end?
 */

void uvm_km_free_wakeup(map, addr, size)
    vm_map_t map;
    vm_offset_t addr;
    vm_size_t size;
{
    vm_map_entry_t dead_entries;

    vm_map_lock(map);
    (void)uvm_unmap_remove(map, trunc_page(addr), round_page(addr+size), 1,
        &dead_entries);
    thread_wakeup(map);
    vm_map_unlock(map);

    if (dead_entries != NULL)
        uvm_unmap_detach(dead_entries, 0);
}
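
/*
 * Example (an illustrative sketch, not from the original source):
 * uvm_km_free_wakeup pairs naturally with uvm_km_valloc_wait (below),
 * since the thread_wakeup on the map kicks any allocator sleeping for
 * space.  "exec_map" and "len" are stand-ins for the caller's map and
 * size.
 *
 *     va = uvm_km_valloc_wait(exec_map, len);
 *     ... use the memory ...
 *     uvm_km_free_wakeup(exec_map, va, len);
 */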

/*
 * uvm_km_alloc1: allocate wired down memory in the kernel map.
 *
 * => we can sleep if needed
 */

vm_offset_t uvm_km_alloc1(map, size, zeroit)
    vm_map_t map;
    vm_size_t size;
    boolean_t zeroit;
{
    vm_offset_t kva, loopva, offset;
    struct vm_page *pg;
    UVMHIST_FUNC("uvm_km_alloc1"); UVMHIST_CALLED(maphist);

    UVMHIST_LOG(maphist,"(map=0x%x, size=0x%x)", map, size,0,0);

#ifdef DIAGNOSTIC
    if (vm_map_pmap(map) != pmap_kernel())
        panic("uvm_km_alloc1");
#endif

    size = round_page(size);
    kva = vm_map_min(map);      /* hint */

    /*
     * allocate some virtual space
     */

    if (uvm_map(map, &kva, size, uvm.kernel_object, UVM_UNKNOWN_OFFSET,
        UVM_MAPFLAG(UVM_PROT_ALL, UVM_PROT_ALL, UVM_INH_NONE,
        UVM_ADV_RANDOM, 0)) != KERN_SUCCESS) {
        UVMHIST_LOG(maphist,"<- done (no VM)",0,0,0,0);
        return(0);
    }

    /*
     * recover object offset from virtual address
     */

    offset = kva - vm_map_min(map);
    UVMHIST_LOG(maphist, "  kva=0x%x, offset=0x%x", kva, offset,0,0);

    /*
     * now allocate the memory.  we must be careful about released pages.
     */

    loopva = kva;
    while (size) {
        simple_lock(&uvm.kernel_object->vmobjlock);
        pg = uvm_pagelookup(uvm.kernel_object, offset);

        /* if we found a page in an unallocated region, it must be released */
        if (pg) {
            if ((pg->flags & PG_RELEASED) == 0)
                panic("uvm_km_alloc1: non-released page");
            pg->flags |= PG_WANTED;
            UVM_UNLOCK_AND_WAIT(pg, &uvm.kernel_object->vmobjlock, 0,
                "km_alloc", 0);
            continue;   /* retry */
        }

        /* allocate ram */
        pg = uvm_pagealloc(uvm.kernel_object, offset, NULL);
        if (pg) {
            pg->flags &= ~PG_BUSY;      /* new page */
            UVM_PAGE_OWN(pg, NULL);
        }
        simple_unlock(&uvm.kernel_object->vmobjlock);
        if (pg == NULL) {
            uvm_wait("km_alloc1w");     /* wait for memory */
            continue;
        }

        /* map it in */
#if defined(PMAP_NEW)
        pmap_kenter_pa(loopva, VM_PAGE_TO_PHYS(pg), UVM_PROT_ALL);
#else
        pmap_enter(map->pmap, loopva, VM_PAGE_TO_PHYS(pg), UVM_PROT_ALL, TRUE);
#endif
        loopva += PAGE_SIZE;
        offset += PAGE_SIZE;
        size -= PAGE_SIZE;
    }

    /*
     * zero on request (note that "size" is now zero due to the above loop
     * so we need to subtract kva from loopva to reconstruct the size).
     */

    if (zeroit)
        bzero((caddr_t)kva, loopva - kva);

    UVMHIST_LOG(maphist,"<- done (kva=0x%x)", kva,0,0,0);
    return(kva);
}
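
/*
 * Example (an illustrative sketch, not from the original source):
 *
 *     vm_offset_t va;
 *
 *     va = uvm_km_alloc1(kernel_map, PAGE_SIZE, TRUE);
 *
 * This sleeps until physical pages are available and returns wired,
 * zero-filled memory, or 0 if the map itself has no free VA.
 */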

/*
 * uvm_km_valloc: allocate zero-fill memory in the kernel's address space
 *
 * => memory is not allocated until fault time
 */

vm_offset_t uvm_km_valloc(map, size)
    vm_map_t map;
    vm_size_t size;
{
    vm_offset_t kva;
    UVMHIST_FUNC("uvm_km_valloc"); UVMHIST_CALLED(maphist);

    UVMHIST_LOG(maphist, "(map=0x%x, size=0x%x)", map, size, 0,0);

#ifdef DIAGNOSTIC
    if (vm_map_pmap(map) != pmap_kernel())
        panic("uvm_km_valloc");
#endif

    size = round_page(size);
    kva = vm_map_min(map);      /* hint */

    /*
     * allocate some virtual space.  will be demand filled by kernel_object.
     */

    if (uvm_map(map, &kva, size, uvm.kernel_object, UVM_UNKNOWN_OFFSET,
        UVM_MAPFLAG(UVM_PROT_ALL, UVM_PROT_ALL, UVM_INH_NONE,
        UVM_ADV_RANDOM, 0)) != KERN_SUCCESS) {
        UVMHIST_LOG(maphist, "<- done (no VM)", 0,0,0,0);
        return(0);
    }

    UVMHIST_LOG(maphist, "<- done (kva=0x%x)", kva,0,0,0);
    return(kva);
}
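
/*
 * Example (an illustrative sketch, not from the original source): VA is
 * reserved now, but no physical pages are allocated until the first
 * touch, which faults through kernel_object into uvm_km_get above.
 *
 *     vm_offset_t va;
 *
 *     va = uvm_km_valloc(kernel_map, 4 * PAGE_SIZE);
 *     if (va != 0)
 *         *(char *)va = 1;
 *
 * The store faults in and zero-fills a single page on demand.
 */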

/*
 * uvm_km_valloc_wait: allocate zero-fill memory in the kernel's address space
 *
 * => memory is not allocated until fault time
 * => if no room in map, wait for space to free, unless requested size
 *    is larger than map (in which case we return 0)
 */

vm_offset_t uvm_km_valloc_wait(map, size)
    vm_map_t map;
    vm_size_t size;
{
    vm_offset_t kva;
    UVMHIST_FUNC("uvm_km_valloc_wait"); UVMHIST_CALLED(maphist);

    UVMHIST_LOG(maphist, "(map=0x%x, size=0x%x)", map, size, 0,0);

#ifdef DIAGNOSTIC
    if (vm_map_pmap(map) != pmap_kernel())
        panic("uvm_km_valloc_wait");
#endif

    size = round_page(size);
    if (size > vm_map_max(map) - vm_map_min(map))
        return(0);

    while (1) {
        kva = vm_map_min(map);      /* hint */

        /*
         * allocate some virtual space.  will be demand filled
         * by kernel_object.
         */

        if (uvm_map(map, &kva, size, uvm.kernel_object, UVM_UNKNOWN_OFFSET,
            UVM_MAPFLAG(UVM_PROT_ALL, UVM_PROT_ALL, UVM_INH_NONE,
            UVM_ADV_RANDOM, 0)) == KERN_SUCCESS) {
            UVMHIST_LOG(maphist,"<- done (kva=0x%x)", kva,0,0,0);
            return(kva);
        }

        /*
         * failed.  sleep for a while (on map)
         */

        UVMHIST_LOG(maphist,"<<<sleeping>>>",0,0,0,0);
        tsleep((caddr_t)map, PVM, "vallocwait", 0);
    }
    /*NOTREACHED*/
}