uvm_anon.c revision 1.19 1 1.19 chs /* $NetBSD: uvm_anon.c,v 1.19 2001/10/21 00:04:42 chs Exp $ */
2 1.1 chuck
3 1.1 chuck /*
4 1.1 chuck *
5 1.1 chuck * Copyright (c) 1997 Charles D. Cranor and Washington University.
6 1.1 chuck * All rights reserved.
7 1.1 chuck *
8 1.1 chuck * Redistribution and use in source and binary forms, with or without
9 1.1 chuck * modification, are permitted provided that the following conditions
10 1.1 chuck * are met:
11 1.1 chuck * 1. Redistributions of source code must retain the above copyright
12 1.1 chuck * notice, this list of conditions and the following disclaimer.
13 1.1 chuck * 2. Redistributions in binary form must reproduce the above copyright
14 1.1 chuck * notice, this list of conditions and the following disclaimer in the
15 1.1 chuck * documentation and/or other materials provided with the distribution.
16 1.1 chuck * 3. All advertising materials mentioning features or use of this software
17 1.1 chuck * must display the following acknowledgement:
18 1.1 chuck * This product includes software developed by Charles D. Cranor and
19 1.1 chuck * Washington University.
20 1.1 chuck * 4. The name of the author may not be used to endorse or promote products
21 1.1 chuck * derived from this software without specific prior written permission.
22 1.1 chuck *
23 1.1 chuck * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
24 1.1 chuck * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
25 1.1 chuck * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
26 1.1 chuck * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
27 1.1 chuck * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
28 1.1 chuck * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
29 1.1 chuck * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
30 1.1 chuck * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
31 1.1 chuck * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
32 1.1 chuck * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
33 1.1 chuck */
34 1.1 chuck
35 1.1 chuck /*
36 1.1 chuck * uvm_anon.c: uvm anon ops
37 1.1 chuck */
38 1.1 chuck
39 1.1 chuck #include "opt_uvmhist.h"
40 1.1 chuck
41 1.1 chuck #include <sys/param.h>
42 1.1 chuck #include <sys/systm.h>
43 1.1 chuck #include <sys/proc.h>
44 1.1 chuck #include <sys/malloc.h>
45 1.1 chuck #include <sys/pool.h>
46 1.5 chs #include <sys/kernel.h>
47 1.1 chuck
48 1.1 chuck #include <uvm/uvm.h>
49 1.1 chuck #include <uvm/uvm_swap.h>
50 1.1 chuck
51 1.1 chuck /*
52 1.5 chs * anonblock_list: global list of anon blocks,
53 1.5 chs * locked by swap_syscall_lock (since we never remove
54 1.5 chs * anything from this list and we only add to it via swapctl(2)).
55 1.5 chs */
56 1.5 chs
57 1.5 chs struct uvm_anonblock {
58 1.5 chs LIST_ENTRY(uvm_anonblock) list;
59 1.5 chs int count;
60 1.5 chs struct vm_anon *anons;
61 1.5 chs };
62 1.5 chs static LIST_HEAD(anonlist, uvm_anonblock) anonblock_list;
63 1.5 chs
64 1.5 chs
65 1.5 chs static boolean_t anon_pagein __P((struct vm_anon *));
66 1.5 chs
67 1.5 chs
68 1.5 chs /*
69 1.1 chuck * allocate anons
70 1.1 chuck */
71 1.1 chuck void
72 1.1 chuck uvm_anon_init()
73 1.1 chuck {
74 1.1 chuck int nanon = uvmexp.free - (uvmexp.free / 16); /* XXXCDC ??? */
75 1.5 chs
76 1.5 chs simple_lock_init(&uvm.afreelock);
77 1.5 chs LIST_INIT(&anonblock_list);
78 1.1 chuck
79 1.1 chuck /*
80 1.1 chuck * Allocate the initial anons.
81 1.1 chuck */
82 1.5 chs uvm_anon_add(nanon);
83 1.1 chuck }
84 1.1 chuck
85 1.1 chuck /*
86 1.1 chuck * add some more anons to the free pool. called when we add
87 1.1 chuck * more swap space.
88 1.5 chs *
89 1.5 chs * => swap_syscall_lock should be held (protects anonblock_list).
90 1.1 chuck */
91 1.11 chs int
92 1.5 chs uvm_anon_add(count)
93 1.5 chs int count;
94 1.1 chuck {
95 1.5 chs struct uvm_anonblock *anonblock;
96 1.1 chuck struct vm_anon *anon;
97 1.5 chs int lcv, needed;
98 1.1 chuck
99 1.5 chs simple_lock(&uvm.afreelock);
100 1.5 chs uvmexp.nanonneeded += count;
101 1.5 chs needed = uvmexp.nanonneeded - uvmexp.nanon;
102 1.5 chs simple_unlock(&uvm.afreelock);
103 1.5 chs
104 1.5 chs if (needed <= 0) {
105 1.11 chs return 0;
106 1.5 chs }
107 1.5 chs anon = (void *)uvm_km_alloc(kernel_map, sizeof(*anon) * needed);
108 1.11 chs if (anon == NULL) {
109 1.11 chs simple_lock(&uvm.afreelock);
110 1.11 chs uvmexp.nanonneeded -= count;
111 1.11 chs simple_unlock(&uvm.afreelock);
112 1.11 chs return ENOMEM;
113 1.1 chuck }
114 1.11 chs MALLOC(anonblock, void *, sizeof(*anonblock), M_UVMAMAP, M_WAITOK);
115 1.1 chuck
116 1.5 chs anonblock->count = needed;
117 1.5 chs anonblock->anons = anon;
118 1.5 chs LIST_INSERT_HEAD(&anonblock_list, anonblock, list);
119 1.5 chs memset(anon, 0, sizeof(*anon) * needed);
120 1.17 chs
121 1.1 chuck simple_lock(&uvm.afreelock);
122 1.5 chs uvmexp.nanon += needed;
123 1.5 chs uvmexp.nfreeanon += needed;
124 1.5 chs for (lcv = 0; lcv < needed; lcv++) {
125 1.1 chuck simple_lock_init(&anon->an_lock);
126 1.1 chuck anon[lcv].u.an_nxt = uvm.afree;
127 1.1 chuck uvm.afree = &anon[lcv];
128 1.3 ross simple_lock_init(&uvm.afree->an_lock);
129 1.1 chuck }
130 1.1 chuck simple_unlock(&uvm.afreelock);
131 1.11 chs return 0;
132 1.1 chuck }
133 1.1 chuck
134 1.1 chuck /*
135 1.5 chs * remove anons from the free pool.
136 1.5 chs */
137 1.5 chs void
138 1.5 chs uvm_anon_remove(count)
139 1.5 chs int count;
140 1.5 chs {
141 1.5 chs /*
142 1.5 chs * we never actually free any anons, to avoid allocation overhead.
143 1.5 chs * XXX someday we might want to try to free anons.
144 1.5 chs */
145 1.5 chs
146 1.5 chs simple_lock(&uvm.afreelock);
147 1.5 chs uvmexp.nanonneeded -= count;
148 1.5 chs simple_unlock(&uvm.afreelock);
149 1.5 chs }
150 1.5 chs
151 1.5 chs /*
152 1.1 chuck * allocate an anon
153 1.13 thorpej *
154 1.13 thorpej * => new anon is returned locked!
155 1.1 chuck */
156 1.1 chuck struct vm_anon *
157 1.1 chuck uvm_analloc()
158 1.1 chuck {
159 1.1 chuck struct vm_anon *a;
160 1.1 chuck
161 1.1 chuck simple_lock(&uvm.afreelock);
162 1.1 chuck a = uvm.afree;
163 1.1 chuck if (a) {
164 1.1 chuck uvm.afree = a->u.an_nxt;
165 1.1 chuck uvmexp.nfreeanon--;
166 1.1 chuck a->an_ref = 1;
167 1.1 chuck a->an_swslot = 0;
168 1.1 chuck a->u.an_page = NULL; /* so we can free quickly */
169 1.13 thorpej LOCK_ASSERT(simple_lock_held(&a->an_lock) == 0);
170 1.13 thorpej simple_lock(&a->an_lock);
171 1.1 chuck }
172 1.1 chuck simple_unlock(&uvm.afreelock);
173 1.1 chuck return(a);
174 1.1 chuck }
175 1.1 chuck
176 1.1 chuck /*
177 1.1 chuck * uvm_anfree: free a single anon structure
178 1.1 chuck *
179 1.1 chuck * => caller must remove anon from its amap before calling (if it was in
180 1.1 chuck * an amap).
181 1.1 chuck * => anon must be unlocked and have a zero reference count.
182 1.1 chuck * => we may lock the pageq's.
183 1.1 chuck */
184 1.1 chuck void
185 1.1 chuck uvm_anfree(anon)
186 1.1 chuck struct vm_anon *anon;
187 1.1 chuck {
188 1.1 chuck struct vm_page *pg;
189 1.1 chuck UVMHIST_FUNC("uvm_anfree"); UVMHIST_CALLED(maphist);
190 1.1 chuck UVMHIST_LOG(maphist,"(anon=0x%x)", anon, 0,0,0);
191 1.1 chuck
192 1.12 thorpej KASSERT(anon->an_ref == 0);
193 1.18 chs LOCK_ASSERT(!simple_lock_held(&anon->an_lock));
194 1.12 thorpej
195 1.1 chuck /*
196 1.1 chuck * get page
197 1.1 chuck */
198 1.1 chuck
199 1.1 chuck pg = anon->u.an_page;
200 1.1 chuck
201 1.1 chuck /*
202 1.1 chuck * if there is a resident page and it is loaned, then anon may not
203 1.1 chuck * own it. call out to uvm_anon_lockpage() to ensure the real owner
204 1.1 chuck * of the page has been identified and locked.
205 1.1 chuck */
206 1.1 chuck
207 1.1 chuck if (pg && pg->loan_count)
208 1.1 chuck pg = uvm_anon_lockloanpg(anon);
209 1.1 chuck
210 1.1 chuck /*
211 1.1 chuck * if we have a resident page, we must dispose of it before freeing
212 1.1 chuck * the anon.
213 1.1 chuck */
214 1.1 chuck
215 1.1 chuck if (pg) {
216 1.1 chuck
217 1.1 chuck /*
218 1.17 chs * if the page is owned by a uobject (now locked), then we must
219 1.1 chuck * kill the loan on the page rather than free it.
220 1.1 chuck */
221 1.1 chuck
222 1.1 chuck if (pg->uobject) {
223 1.1 chuck uvm_lock_pageq();
224 1.10 chs KASSERT(pg->loan_count > 0);
225 1.1 chuck pg->loan_count--;
226 1.1 chuck pg->uanon = NULL;
227 1.1 chuck uvm_unlock_pageq();
228 1.1 chuck simple_unlock(&pg->uobject->vmobjlock);
229 1.1 chuck } else {
230 1.1 chuck
231 1.1 chuck /*
232 1.1 chuck * page has no uobject, so we must be the owner of it.
233 1.18 chs * if page is busy then we wait until it is not busy,
234 1.18 chs * and then free it.
235 1.1 chuck */
236 1.1 chuck
237 1.18 chs KASSERT((pg->flags & PG_RELEASED) == 0);
238 1.19 chs simple_lock(&anon->an_lock);
239 1.18 chs pmap_page_protect(pg, VM_PROT_NONE);
240 1.18 chs while ((pg = anon->u.an_page) &&
241 1.18 chs (pg->flags & PG_BUSY) != 0) {
242 1.18 chs pg->flags |= PG_WANTED;
243 1.18 chs UVM_UNLOCK_AND_WAIT(pg, &anon->an_lock, 0,
244 1.18 chs "anfree", 0);
245 1.18 chs simple_lock(&anon->an_lock);
246 1.18 chs }
247 1.18 chs if (pg) {
248 1.18 chs uvm_lock_pageq();
249 1.18 chs uvm_pagefree(pg);
250 1.18 chs uvm_unlock_pageq();
251 1.17 chs }
252 1.19 chs simple_unlock(&anon->an_lock);
253 1.18 chs UVMHIST_LOG(maphist, "anon 0x%x, page 0x%x: "
254 1.18 chs "freed now!", anon, pg, 0, 0);
255 1.1 chuck }
256 1.1 chuck }
257 1.1 chuck
258 1.1 chuck /*
259 1.2 chs * free any swap resources.
260 1.1 chuck */
261 1.18 chs
262 1.2 chs uvm_anon_dropswap(anon);
263 1.1 chuck
264 1.1 chuck /*
265 1.18 chs * now that we've stripped the data areas from the anon,
266 1.18 chs * free the anon itself.
267 1.1 chuck */
268 1.18 chs
269 1.1 chuck simple_lock(&uvm.afreelock);
270 1.1 chuck anon->u.an_nxt = uvm.afree;
271 1.1 chuck uvm.afree = anon;
272 1.1 chuck uvmexp.nfreeanon++;
273 1.1 chuck simple_unlock(&uvm.afreelock);
274 1.1 chuck UVMHIST_LOG(maphist,"<- done!",0,0,0,0);
275 1.2 chs }
276 1.2 chs
277 1.2 chs /*
278 1.2 chs * uvm_anon_dropswap: release any swap resources from this anon.
279 1.17 chs *
280 1.2 chs * => anon must be locked or have a reference count of 0.
281 1.2 chs */
282 1.2 chs void
283 1.2 chs uvm_anon_dropswap(anon)
284 1.2 chs struct vm_anon *anon;
285 1.2 chs {
286 1.2 chs UVMHIST_FUNC("uvm_anon_dropswap"); UVMHIST_CALLED(maphist);
287 1.12 thorpej
288 1.12 thorpej if (anon->an_swslot == 0)
289 1.2 chs return;
290 1.2 chs
291 1.2 chs UVMHIST_LOG(maphist,"freeing swap for anon %p, paged to swslot 0x%x",
292 1.2 chs anon, anon->an_swslot, 0, 0);
293 1.2 chs uvm_swap_free(anon->an_swslot, 1);
294 1.2 chs anon->an_swslot = 0;
295 1.2 chs
296 1.2 chs if (anon->u.an_page == NULL) {
297 1.2 chs /* this page is no longer only in swap. */
298 1.2 chs simple_lock(&uvm.swap_data_lock);
299 1.2 chs uvmexp.swpgonly--;
300 1.2 chs simple_unlock(&uvm.swap_data_lock);
301 1.17 chs }
302 1.1 chuck }
303 1.1 chuck
304 1.1 chuck /*
305 1.1 chuck * uvm_anon_lockloanpg: given a locked anon, lock its resident page
306 1.1 chuck *
307 1.1 chuck * => anon is locked by caller
308 1.1 chuck * => on return: anon is locked
309 1.1 chuck * if there is a resident page:
310 1.1 chuck * if it has a uobject, it is locked by us
311 1.1 chuck * if it is ownerless, we take over as owner
312 1.1 chuck * we return the resident page (it can change during
313 1.1 chuck * this function)
314 1.1 chuck * => note that the only time an anon has an ownerless resident page
315 1.1 chuck * is if the page was loaned from a uvm_object and the uvm_object
316 1.1 chuck * disowned it
317 1.1 chuck * => this only needs to be called when you want to do an operation
318 1.1 chuck * on an anon's resident page and that page has a non-zero loan
319 1.1 chuck * count.
320 1.1 chuck */
321 1.1 chuck struct vm_page *
322 1.1 chuck uvm_anon_lockloanpg(anon)
323 1.1 chuck struct vm_anon *anon;
324 1.1 chuck {
325 1.1 chuck struct vm_page *pg;
326 1.1 chuck boolean_t locked = FALSE;
327 1.1 chuck
328 1.12 thorpej LOCK_ASSERT(simple_lock_held(&anon->an_lock));
329 1.12 thorpej
330 1.1 chuck /*
331 1.1 chuck * loop while we have a resident page that has a non-zero loan count.
332 1.1 chuck * if we successfully get our lock, we will "break" the loop.
333 1.1 chuck * note that the test for pg->loan_count is not protected -- this
334 1.1 chuck * may produce false positive results. note that a false positive
335 1.1 chuck * result may cause us to do more work than we need to, but it will
336 1.1 chuck * not produce an incorrect result.
337 1.1 chuck */
338 1.1 chuck
339 1.1 chuck while (((pg = anon->u.an_page) != NULL) && pg->loan_count != 0) {
340 1.1 chuck
341 1.1 chuck /*
342 1.1 chuck * quickly check to see if the page has an object before
343 1.1 chuck * bothering to lock the page queues. this may also produce
344 1.1 chuck * a false positive result, but that's ok because we do a real
345 1.1 chuck * check after that.
346 1.1 chuck */
347 1.1 chuck
348 1.1 chuck if (pg->uobject) {
349 1.1 chuck uvm_lock_pageq();
350 1.18 chs if (pg->uobject) {
351 1.1 chuck locked =
352 1.1 chuck simple_lock_try(&pg->uobject->vmobjlock);
353 1.1 chuck } else {
354 1.1 chuck /* object disowned before we got PQ lock */
355 1.1 chuck locked = TRUE;
356 1.1 chuck }
357 1.1 chuck uvm_unlock_pageq();
358 1.1 chuck
359 1.1 chuck /*
360 1.1 chuck * if we didn't get a lock (try lock failed), then we
361 1.1 chuck * toggle our anon lock and try again
362 1.1 chuck */
363 1.1 chuck
364 1.1 chuck if (!locked) {
365 1.1 chuck simple_unlock(&anon->an_lock);
366 1.10 chs
367 1.1 chuck /*
368 1.1 chuck * someone locking the object has a chance to
369 1.1 chuck * lock us right now
370 1.1 chuck */
371 1.10 chs
372 1.1 chuck simple_lock(&anon->an_lock);
373 1.10 chs continue;
374 1.1 chuck }
375 1.1 chuck }
376 1.1 chuck
377 1.1 chuck /*
378 1.1 chuck * if page is un-owned [i.e. the object dropped its ownership],
379 1.1 chuck * then we can take over as owner!
380 1.1 chuck */
381 1.1 chuck
382 1.1 chuck if (pg->uobject == NULL && (pg->pqflags & PQ_ANON) == 0) {
383 1.1 chuck uvm_lock_pageq();
384 1.18 chs pg->pqflags |= PQ_ANON;
385 1.18 chs pg->loan_count--;
386 1.1 chuck uvm_unlock_pageq();
387 1.1 chuck }
388 1.1 chuck break;
389 1.1 chuck }
390 1.1 chuck return(pg);
391 1.5 chs }
392 1.5 chs
393 1.5 chs
394 1.5 chs
395 1.5 chs /*
396 1.5 chs * page in every anon that is paged out to a range of swslots.
397 1.17 chs *
398 1.5 chs * swap_syscall_lock should be held (protects anonblock_list).
399 1.5 chs */
400 1.5 chs
401 1.5 chs boolean_t
402 1.5 chs anon_swap_off(startslot, endslot)
403 1.5 chs int startslot, endslot;
404 1.5 chs {
405 1.5 chs struct uvm_anonblock *anonblock;
406 1.5 chs
407 1.18 chs LIST_FOREACH(anonblock, &anonblock_list, list) {
408 1.5 chs int i;
409 1.5 chs
410 1.5 chs /*
411 1.5 chs * loop thru all the anons in the anonblock,
412 1.5 chs * paging in where needed.
413 1.5 chs */
414 1.5 chs
415 1.5 chs for (i = 0; i < anonblock->count; i++) {
416 1.5 chs struct vm_anon *anon = &anonblock->anons[i];
417 1.5 chs int slot;
418 1.5 chs
419 1.5 chs /*
420 1.5 chs * lock anon to work on it.
421 1.5 chs */
422 1.5 chs
423 1.5 chs simple_lock(&anon->an_lock);
424 1.5 chs
425 1.5 chs /*
426 1.5 chs * is this anon's swap slot in range?
427 1.5 chs */
428 1.5 chs
429 1.5 chs slot = anon->an_swslot;
430 1.5 chs if (slot >= startslot && slot < endslot) {
431 1.5 chs boolean_t rv;
432 1.5 chs
433 1.5 chs /*
434 1.5 chs * yup, page it in.
435 1.5 chs */
436 1.5 chs
437 1.5 chs /* locked: anon */
438 1.5 chs rv = anon_pagein(anon);
439 1.5 chs /* unlocked: anon */
440 1.5 chs
441 1.5 chs if (rv) {
442 1.5 chs return rv;
443 1.5 chs }
444 1.5 chs } else {
445 1.5 chs
446 1.5 chs /*
447 1.5 chs * nope, unlock and proceed.
448 1.5 chs */
449 1.5 chs
450 1.5 chs simple_unlock(&anon->an_lock);
451 1.5 chs }
452 1.5 chs }
453 1.5 chs }
454 1.5 chs return FALSE;
455 1.5 chs }
456 1.5 chs
457 1.5 chs
458 1.5 chs /*
459 1.5 chs * fetch an anon's page.
460 1.5 chs *
461 1.5 chs * => anon must be locked, and is unlocked upon return.
462 1.5 chs * => returns TRUE if pagein was aborted due to lack of memory.
463 1.5 chs */
464 1.5 chs
465 1.5 chs static boolean_t
466 1.5 chs anon_pagein(anon)
467 1.5 chs struct vm_anon *anon;
468 1.5 chs {
469 1.5 chs struct vm_page *pg;
470 1.5 chs struct uvm_object *uobj;
471 1.5 chs int rv;
472 1.8 thorpej
473 1.5 chs /* locked: anon */
474 1.12 thorpej LOCK_ASSERT(simple_lock_held(&anon->an_lock));
475 1.12 thorpej
476 1.5 chs rv = uvmfault_anonget(NULL, NULL, anon);
477 1.12 thorpej
478 1.8 thorpej /*
479 1.16 chs * if rv == 0, anon is still locked, else anon
480 1.8 thorpej * is unlocked
481 1.8 thorpej */
482 1.5 chs
483 1.5 chs switch (rv) {
484 1.16 chs case 0:
485 1.5 chs break;
486 1.5 chs
487 1.16 chs case EIO:
488 1.16 chs case ERESTART:
489 1.5 chs
490 1.5 chs /*
491 1.5 chs * nothing more to do on errors.
492 1.16 chs * ERESTART can only mean that the anon was freed,
493 1.5 chs * so again there's nothing to do.
494 1.5 chs */
495 1.5 chs
496 1.5 chs return FALSE;
497 1.5 chs }
498 1.5 chs
499 1.5 chs /*
500 1.5 chs * ok, we've got the page now.
501 1.5 chs * mark it as dirty, clear its swslot and un-busy it.
502 1.5 chs */
503 1.5 chs
504 1.5 chs pg = anon->u.an_page;
505 1.5 chs uobj = pg->uobject;
506 1.5 chs uvm_swap_free(anon->an_swslot, 1);
507 1.5 chs anon->an_swslot = 0;
508 1.5 chs pg->flags &= ~(PG_CLEAN);
509 1.5 chs
510 1.5 chs /*
511 1.5 chs * deactivate the page (to put it on a page queue)
512 1.5 chs */
513 1.5 chs
514 1.5 chs pmap_clear_reference(pg);
515 1.5 chs uvm_lock_pageq();
516 1.5 chs uvm_pagedeactivate(pg);
517 1.5 chs uvm_unlock_pageq();
518 1.5 chs
519 1.5 chs /*
520 1.5 chs * unlock the anon and we're done.
521 1.5 chs */
522 1.5 chs
523 1.5 chs simple_unlock(&anon->an_lock);
524 1.5 chs if (uobj) {
525 1.5 chs simple_unlock(&uobj->vmobjlock);
526 1.5 chs }
527 1.5 chs return FALSE;
528 1.1 chuck }
529