/*	$NetBSD: uvm_anon.c,v 1.12 2001/01/23 01:56:16 thorpej Exp $	*/

/*
 *
 * Copyright (c) 1997 Charles D. Cranor and Washington University.
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. All advertising materials mentioning features or use of this software
 *    must display the following acknowledgement:
 *      This product includes software developed by Charles D. Cranor and
 *      Washington University.
 * 4. The name of the author may not be used to endorse or promote products
 *    derived from this software without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
 * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
 * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */

/*
 * uvm_anon.c: uvm anon ops
 */

#include "opt_uvmhist.h"

#include <sys/param.h>
#include <sys/systm.h>
#include <sys/proc.h>
#include <sys/malloc.h>
#include <sys/pool.h>
#include <sys/kernel.h>

#include <uvm/uvm.h>
#include <uvm/uvm_swap.h>

/*
 * anonblock_list: global list of anon blocks,
 * locked by swap_syscall_lock (since we never remove
 * anything from this list and we only add to it via swapctl(2)).
 */

struct uvm_anonblock {
        LIST_ENTRY(uvm_anonblock) list;
        int count;
        struct vm_anon *anons;
};
static LIST_HEAD(anonlist, uvm_anonblock) anonblock_list;
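
/*
 * note: free anons themselves are kept on a singly-linked list headed by
 * uvm.afree and chained through u.an_nxt; that list and the counters
 * uvmexp.nanon/nfreeanon/nanonneeded are protected by uvm.afreelock
 * (see uvm_analloc() and uvm_anfree() below).
 */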


static boolean_t anon_pagein __P((struct vm_anon *));


/*
 * allocate anons
 */
void
uvm_anon_init()
{
        int nanon = uvmexp.free - (uvmexp.free / 16); /* XXXCDC ??? */
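        /*
         * (i.e. allocate one anon for roughly 15/16 of the pages that are
         * currently free -- presumably a rough guess at how much anonymous
         * memory the system may need, hence the XXX above.)
         */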

        simple_lock_init(&uvm.afreelock);
        LIST_INIT(&anonblock_list);

        /*
         * Allocate the initial anons.
         */
        uvm_anon_add(nanon);
}

/*
 * add some more anons to the free pool.  called when we add
 * more swap space.
 *
 * => swap_syscall_lock should be held (protects anonblock_list).
 */
int
uvm_anon_add(count)
        int count;
{
        struct uvm_anonblock *anonblock;
        struct vm_anon *anon;
        int lcv, needed;

        simple_lock(&uvm.afreelock);
        uvmexp.nanonneeded += count;
        needed = uvmexp.nanonneeded - uvmexp.nanon;
        simple_unlock(&uvm.afreelock);

        if (needed <= 0) {
                return 0;
        }
        anon = (void *)uvm_km_alloc(kernel_map, sizeof(*anon) * needed);
        if (anon == NULL) {
                simple_lock(&uvm.afreelock);
                uvmexp.nanonneeded -= count;
                simple_unlock(&uvm.afreelock);
                return ENOMEM;
        }
        MALLOC(anonblock, void *, sizeof(*anonblock), M_UVMAMAP, M_WAITOK);

        anonblock->count = needed;
        anonblock->anons = anon;
        LIST_INSERT_HEAD(&anonblock_list, anonblock, list);
        memset(anon, 0, sizeof(*anon) * needed);

        simple_lock(&uvm.afreelock);
        uvmexp.nanon += needed;
        uvmexp.nfreeanon += needed;
        for (lcv = 0; lcv < needed; lcv++) {
                anon[lcv].u.an_nxt = uvm.afree;
                uvm.afree = &anon[lcv];
                simple_lock_init(&uvm.afree->an_lock);
        }
        simple_unlock(&uvm.afreelock);
        return 0;
}
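
/*
 * example: adding three anons to an empty free list leaves
 *      uvm.afree -> anon[2] -> anon[1] -> anon[0] -> NULL
 * since each new anon is pushed onto the head of the list via u.an_nxt.
 */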

/*
 * remove anons from the free pool.
 */
void
uvm_anon_remove(count)
        int count;
{
        /*
         * we never actually free any anons, to avoid allocation overhead.
         * XXX someday we might want to try to free anons.
         */

        simple_lock(&uvm.afreelock);
        uvmexp.nanonneeded -= count;
        simple_unlock(&uvm.afreelock);
}

/*
 * allocate an anon
 */
struct vm_anon *
uvm_analloc()
{
        struct vm_anon *a;

        simple_lock(&uvm.afreelock);
        a = uvm.afree;
        if (a) {
                uvm.afree = a->u.an_nxt;
                uvmexp.nfreeanon--;
                a->an_ref = 1;
                a->an_swslot = 0;
                a->u.an_page = NULL;            /* so we can free quickly */
        }
        simple_unlock(&uvm.afreelock);
        return(a);
}
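
/*
 * note: uvm_analloc() returns NULL if the free pool is exhausted.
 * otherwise the new anon starts out with a reference count of 1, no swap
 * slot and no resident page, so the caller is expected to supply a page
 * (or swap slot) and, typically, to enter the anon into an amap.
 */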

/*
 * uvm_anfree: free a single anon structure
 *
 * => caller must remove anon from its amap before calling (if it was in
 *      an amap).
 * => anon must be unlocked and have a zero reference count.
 * => we may lock the pageq's.
 */
void
uvm_anfree(anon)
        struct vm_anon *anon;
{
        struct vm_page *pg;
        UVMHIST_FUNC("uvm_anfree"); UVMHIST_CALLED(maphist);
        UVMHIST_LOG(maphist,"(anon=0x%x)", anon, 0,0,0);

        KASSERT(anon->an_ref == 0);
        LOCK_ASSERT(simple_lock_held(&anon->an_lock) == 0);

        /*
         * get page
         */

        pg = anon->u.an_page;

        /*
         * if there is a resident page and it is loaned, then anon may not
         * own it.  call out to uvm_anon_lockloanpg() to ensure the real
         * owner of the page has been identified and locked.
         */

        if (pg && pg->loan_count)
                pg = uvm_anon_lockloanpg(anon);

        /*
         * if we have a resident page, we must dispose of it before freeing
         * the anon.
         */

        if (pg) {

                /*
                 * if the page is owned by a uobject (now locked), then we must
                 * kill the loan on the page rather than free it.
                 */

                if (pg->uobject) {
                        uvm_lock_pageq();
                        KASSERT(pg->loan_count > 0);
                        pg->loan_count--;
                        pg->uanon = NULL;
                        uvm_unlock_pageq();
                        simple_unlock(&pg->uobject->vmobjlock);
                } else {

                        /*
                         * page has no uobject, so we must be the owner of it.
                         *
                         * if page is busy then we just mark it as released
                         * (who ever has it busy must check for this when they
                         * wake up).  if the page is not busy then we can
                         * free it now.
                         */

                        if ((pg->flags & PG_BUSY) != 0) {
                                /* tell them to dump it when done */
                                pg->flags |= PG_RELEASED;
                                UVMHIST_LOG(maphist,
                                    "  anon 0x%x, page 0x%x: BUSY (released!)",
                                    anon, pg, 0, 0);
                                return;
                        }
                        pmap_page_protect(pg, VM_PROT_NONE);
                        uvm_lock_pageq();       /* lock out pagedaemon */
                        uvm_pagefree(pg);       /* bye bye */
                        uvm_unlock_pageq();     /* free the daemon */
                        UVMHIST_LOG(maphist,"anon 0x%x, page 0x%x: freed now!",
                            anon, pg, 0, 0);
                }
        }

        /*
         * free any swap resources.
         */
        uvm_anon_dropswap(anon);

        /*
         * now that we've stripped the data areas from the anon, free the anon
         * itself!
         */
        simple_lock(&uvm.afreelock);
        anon->u.an_nxt = uvm.afree;
        uvm.afree = anon;
        uvmexp.nfreeanon++;
        simple_unlock(&uvm.afreelock);
        UVMHIST_LOG(maphist,"<- done!",0,0,0,0);
}

/*
 * uvm_anon_dropswap: release any swap resources from this anon.
 *
 * => anon must be locked or have a reference count of 0.
 */
void
uvm_anon_dropswap(anon)
        struct vm_anon *anon;
{
        UVMHIST_FUNC("uvm_anon_dropswap"); UVMHIST_CALLED(maphist);

        if (anon->an_swslot == 0)
                return;

        UVMHIST_LOG(maphist,"freeing swap for anon %p, paged to swslot 0x%x",
            anon, anon->an_swslot, 0, 0);
        uvm_swap_free(anon->an_swslot, 1);
        anon->an_swslot = 0;

        if (anon->u.an_page == NULL) {
                /* this page is no longer only in swap. */
                simple_lock(&uvm.swap_data_lock);
                uvmexp.swpgonly--;
                simple_unlock(&uvm.swap_data_lock);
        }
}
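
/*
 * note: uvmexp.swpgonly counts pages whose only copy lives in swap.  if
 * the anon had no resident page, the data in the swap slot we just freed
 * was the only copy, so the swap-only page count is dropped to match.
 */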

/*
 * uvm_anon_lockloanpg: given a locked anon, lock its resident page
 *
 * => anon is locked by caller
 * => on return: anon is locked
 *      if there is a resident page:
 *              if it has a uobject, it is locked by us
 *              if it is ownerless, we take over as owner
 *      we return the resident page (it can change during
 *      this function)
 * => note that the only time an anon has an ownerless resident page
 *      is if the page was loaned from a uvm_object and the uvm_object
 *      disowned it
 * => this only needs to be called when you want to do an operation
 *      on an anon's resident page and that page has a non-zero loan
 *      count.
 */
struct vm_page *
uvm_anon_lockloanpg(anon)
        struct vm_anon *anon;
{
        struct vm_page *pg;
        boolean_t locked = FALSE;

        LOCK_ASSERT(simple_lock_held(&anon->an_lock));

        /*
         * loop while we have a resident page that has a non-zero loan count.
         * if we successfully get our lock, we will "break" the loop.
         * note that the test for pg->loan_count is not protected -- this
         * may produce false positive results.  note that a false positive
         * result may cause us to do more work than we need to, but it will
         * not produce an incorrect result.
         */

        while (((pg = anon->u.an_page) != NULL) && pg->loan_count != 0) {

                /*
                 * quickly check to see if the page has an object before
                 * bothering to lock the page queues.  this may also produce
                 * a false positive result, but that's ok because we do a real
                 * check after that.
                 *
                 * XXX: quick check -- worth it?  need volatile?
                 */

                if (pg->uobject) {

                        uvm_lock_pageq();
                        if (pg->uobject) {      /* the "real" check */
                                locked =
                                    simple_lock_try(&pg->uobject->vmobjlock);
                        } else {
                                /* object disowned before we got PQ lock */
                                locked = TRUE;
                        }
                        uvm_unlock_pageq();

                        /*
                         * if we didn't get a lock (try lock failed), then we
                         * toggle our anon lock and try again
                         */

                        if (!locked) {
                                simple_unlock(&anon->an_lock);

                                /*
                                 * someone locking the object has a chance to
                                 * lock us right now
                                 */

                                simple_lock(&anon->an_lock);
                                continue;
                        }
                }

                /*
                 * if page is un-owned [i.e. the object dropped its ownership],
                 * then we can take over as owner!
                 */

                if (pg->uobject == NULL && (pg->pqflags & PQ_ANON) == 0) {
                        uvm_lock_pageq();
                        pg->pqflags |= PQ_ANON;         /* take ownership... */
                        pg->loan_count--;       /* ... and drop our loan */
                        uvm_unlock_pageq();
                }

                /*
                 * we did it!  break the loop
                 */

                break;
        }
        return(pg);
}
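
/*
 * note on the locking dance above: we already hold the anon lock, so we
 * can only *try* for the object's lock.  when the try fails we briefly
 * drop and retake the anon lock, giving whoever holds the object lock
 * (and may be trying to lock this anon) a window to make progress, and
 * then start the loop over.
 */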


/*
 * page in every anon that is paged out to a range of swslots.
 *
 * swap_syscall_lock should be held (protects anonblock_list).
 */

boolean_t
anon_swap_off(startslot, endslot)
        int startslot, endslot;
{
        struct uvm_anonblock *anonblock;

        for (anonblock = LIST_FIRST(&anonblock_list);
             anonblock != NULL;
             anonblock = LIST_NEXT(anonblock, list)) {
                int i;

                /*
                 * loop thru all the anons in the anonblock,
                 * paging in where needed.
                 */

                for (i = 0; i < anonblock->count; i++) {
                        struct vm_anon *anon = &anonblock->anons[i];
                        int slot;

                        /*
                         * lock anon to work on it.
                         */

                        simple_lock(&anon->an_lock);

                        /*
                         * is this anon's swap slot in range?
                         */

                        slot = anon->an_swslot;
                        if (slot >= startslot && slot < endslot) {
                                boolean_t rv;

                                /*
                                 * yup, page it in.
                                 */

                                /* locked: anon */
                                rv = anon_pagein(anon);
                                /* unlocked: anon */

                                if (rv) {
                                        return rv;
                                }
                        } else {

                                /*
                                 * nope, unlock and proceed.
                                 */

                                simple_unlock(&anon->an_lock);
                        }
                }
        }
        return FALSE;
}
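
/*
 * note: anon_swap_off() returns TRUE as soon as a pagein has to be
 * aborted (see anon_pagein() below), and FALSE once every anon with a
 * swap slot in [startslot, endslot) has been brought back into memory.
 */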


/*
 * fetch an anon's page.
 *
 * => anon must be locked, and is unlocked upon return.
 * => returns TRUE if pagein was aborted due to lack of memory.
 */

static boolean_t
anon_pagein(anon)
        struct vm_anon *anon;
{
        struct vm_page *pg;
        struct uvm_object *uobj;
        int rv;

        /* locked: anon */
        LOCK_ASSERT(simple_lock_held(&anon->an_lock));

        rv = uvmfault_anonget(NULL, NULL, anon);

        /*
         * if rv == VM_PAGER_OK, anon is still locked, else anon
         * is unlocked
         */

        switch (rv) {
        case VM_PAGER_OK:
                break;

        case VM_PAGER_ERROR:
        case VM_PAGER_REFAULT:

                /*
                 * nothing more to do on errors.
                 * VM_PAGER_REFAULT can only mean that the anon was freed,
                 * so again there's nothing to do.
                 */

                return FALSE;

        default:
#ifdef DIAGNOSTIC
                panic("anon_pagein: uvmfault_anonget -> %d", rv);
#else
                return FALSE;
#endif
        }

        /*
         * ok, we've got the page now.
         * mark it as dirty, clear its swslot and un-busy it.
         */

        pg = anon->u.an_page;
        uobj = pg->uobject;
        uvm_swap_free(anon->an_swslot, 1);
        anon->an_swslot = 0;
        pg->flags &= ~(PG_CLEAN);

        /*
         * deactivate the page (to put it on a page queue)
         */

        pmap_clear_reference(pg);
        pmap_page_protect(pg, VM_PROT_NONE);
        uvm_lock_pageq();
        uvm_pagedeactivate(pg);
        uvm_unlock_pageq();

        /*
         * unlock the anon and we're done.
         */

        simple_unlock(&anon->an_lock);
        if (uobj) {
                simple_unlock(&uobj->vmobjlock);
        }
        return FALSE;
}