Home | History | Annotate | Line # | Download | only in uvm
uvm_anon.c revision 1.12
      1 /*	$NetBSD: uvm_anon.c,v 1.12 2001/01/23 01:56:16 thorpej Exp $	*/
      2 
      3 /*
      4  *
      5  * Copyright (c) 1997 Charles D. Cranor and Washington University.
      6  * All rights reserved.
      7  *
      8  * Redistribution and use in source and binary forms, with or without
      9  * modification, are permitted provided that the following conditions
     10  * are met:
     11  * 1. Redistributions of source code must retain the above copyright
     12  *    notice, this list of conditions and the following disclaimer.
     13  * 2. Redistributions in binary form must reproduce the above copyright
     14  *    notice, this list of conditions and the following disclaimer in the
     15  *    documentation and/or other materials provided with the distribution.
     16  * 3. All advertising materials mentioning features or use of this software
     17  *    must display the following acknowledgement:
     18  *      This product includes software developed by Charles D. Cranor and
     19  *      Washington University.
     20  * 4. The name of the author may not be used to endorse or promote products
     21  *    derived from this software without specific prior written permission.
     22  *
     23  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
     24  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
     25  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
     26  * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
     27  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
     28  * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
     29  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
     30  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
     31  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
     32  * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
     33  */
     34 
     35 /*
     36  * uvm_anon.c: uvm anon ops
     37  */
     38 
     39 #include "opt_uvmhist.h"
     40 
     41 #include <sys/param.h>
     42 #include <sys/systm.h>
     43 #include <sys/proc.h>
     44 #include <sys/malloc.h>
     45 #include <sys/pool.h>
     46 #include <sys/kernel.h>
     47 
     48 #include <uvm/uvm.h>
     49 #include <uvm/uvm_swap.h>
     50 
     51 /*
     52  * anonblock_list: global list of anon blocks,
     53  * locked by swap_syscall_lock (since we never remove
     54  * anything from this list and we only add to it via swapctl(2)).
     55  */
     56 
/*
 * uvm_anonblock: bookkeeping for one contiguous array of anons, as
 * allocated by uvm_anon_add().
 */
struct uvm_anonblock {
	LIST_ENTRY(uvm_anonblock) list;	/* linkage on anonblock_list */
	int count;			/* number of anons in the array */
	struct vm_anon *anons;		/* first anon of the array */
};
static LIST_HEAD(anonlist, uvm_anonblock) anonblock_list;


/* brings a single anon's page back in; used by anon_swap_off(). */
static boolean_t anon_pagein __P((struct vm_anon *));
     66 
     67 
     68 /*
     69  * allocate anons
     70  */
     71 void
     72 uvm_anon_init()
     73 {
     74 	int nanon = uvmexp.free - (uvmexp.free / 16); /* XXXCDC ??? */
     75 
     76 	simple_lock_init(&uvm.afreelock);
     77 	LIST_INIT(&anonblock_list);
     78 
     79 	/*
     80 	 * Allocate the initial anons.
     81 	 */
     82 	uvm_anon_add(nanon);
     83 }
     84 
     85 /*
     86  * add some more anons to the free pool.  called when we add
     87  * more swap space.
     88  *
     89  * => swap_syscall_lock should be held (protects anonblock_list).
     90  */
     91 int
     92 uvm_anon_add(count)
     93 	int	count;
     94 {
     95 	struct uvm_anonblock *anonblock;
     96 	struct vm_anon *anon;
     97 	int lcv, needed;
     98 
     99 	simple_lock(&uvm.afreelock);
    100 	uvmexp.nanonneeded += count;
    101 	needed = uvmexp.nanonneeded - uvmexp.nanon;
    102 	simple_unlock(&uvm.afreelock);
    103 
    104 	if (needed <= 0) {
    105 		return 0;
    106 	}
    107 	anon = (void *)uvm_km_alloc(kernel_map, sizeof(*anon) * needed);
    108 	if (anon == NULL) {
    109 		simple_lock(&uvm.afreelock);
    110 		uvmexp.nanonneeded -= count;
    111 		simple_unlock(&uvm.afreelock);
    112 		return ENOMEM;
    113 	}
    114 	MALLOC(anonblock, void *, sizeof(*anonblock), M_UVMAMAP, M_WAITOK);
    115 
    116 	anonblock->count = needed;
    117 	anonblock->anons = anon;
    118 	LIST_INSERT_HEAD(&anonblock_list, anonblock, list);
    119 	memset(anon, 0, sizeof(*anon) * needed);
    120 
    121 	simple_lock(&uvm.afreelock);
    122 	uvmexp.nanon += needed;
    123 	uvmexp.nfreeanon += needed;
    124 	for (lcv = 0; lcv < needed; lcv++) {
    125 		simple_lock_init(&anon->an_lock);
    126 		anon[lcv].u.an_nxt = uvm.afree;
    127 		uvm.afree = &anon[lcv];
    128 		simple_lock_init(&uvm.afree->an_lock);
    129 	}
    130 	simple_unlock(&uvm.afreelock);
    131 	return 0;
    132 }
    133 
    134 /*
    135  * remove anons from the free pool.
    136  */
    137 void
    138 uvm_anon_remove(count)
    139 	int count;
    140 {
    141 	/*
    142 	 * we never actually free any anons, to avoid allocation overhead.
    143 	 * XXX someday we might want to try to free anons.
    144 	 */
    145 
    146 	simple_lock(&uvm.afreelock);
    147 	uvmexp.nanonneeded -= count;
    148 	simple_unlock(&uvm.afreelock);
    149 }
    150 
    151 /*
    152  * allocate an anon
    153  */
    154 struct vm_anon *
    155 uvm_analloc()
    156 {
    157 	struct vm_anon *a;
    158 
    159 	simple_lock(&uvm.afreelock);
    160 	a = uvm.afree;
    161 	if (a) {
    162 		uvm.afree = a->u.an_nxt;
    163 		uvmexp.nfreeanon--;
    164 		a->an_ref = 1;
    165 		a->an_swslot = 0;
    166 		a->u.an_page = NULL;		/* so we can free quickly */
    167 	}
    168 	simple_unlock(&uvm.afreelock);
    169 	return(a);
    170 }
    171 
    172 /*
    173  * uvm_anfree: free a single anon structure
    174  *
    175  * => caller must remove anon from its amap before calling (if it was in
    176  *	an amap).
    177  * => anon must be unlocked and have a zero reference count.
    178  * => we may lock the pageq's.
    179  */
    180 void
    181 uvm_anfree(anon)
    182 	struct vm_anon *anon;
    183 {
    184 	struct vm_page *pg;
    185 	UVMHIST_FUNC("uvm_anfree"); UVMHIST_CALLED(maphist);
    186 	UVMHIST_LOG(maphist,"(anon=0x%x)", anon, 0,0,0);
    187 
    188 	KASSERT(anon->an_ref == 0);
    189 	LOCK_ASSERT(simple_lock_held(&anon->an_lock) == 0);
    190 
    191 	/*
    192 	 * get page
    193 	 */
    194 
    195 	pg = anon->u.an_page;
    196 
    197 	/*
    198 	 * if there is a resident page and it is loaned, then anon may not
    199 	 * own it.   call out to uvm_anon_lockpage() to ensure the real owner
    200  	 * of the page has been identified and locked.
    201 	 */
    202 
    203 	if (pg && pg->loan_count)
    204 		pg = uvm_anon_lockloanpg(anon);
    205 
    206 	/*
    207 	 * if we have a resident page, we must dispose of it before freeing
    208 	 * the anon.
    209 	 */
    210 
    211 	if (pg) {
    212 
    213 		/*
    214 		 * if the page is owned by a uobject (now locked), then we must
    215 		 * kill the loan on the page rather than free it.
    216 		 */
    217 
    218 		if (pg->uobject) {
    219 			uvm_lock_pageq();
    220 			KASSERT(pg->loan_count > 0);
    221 			pg->loan_count--;
    222 			pg->uanon = NULL;
    223 			uvm_unlock_pageq();
    224 			simple_unlock(&pg->uobject->vmobjlock);
    225 		} else {
    226 
    227 			/*
    228 			 * page has no uobject, so we must be the owner of it.
    229 			 *
    230 			 * if page is busy then we just mark it as released
    231 			 * (who ever has it busy must check for this when they
    232 			 * wake up).    if the page is not busy then we can
    233 			 * free it now.
    234 			 */
    235 
    236 			if ((pg->flags & PG_BUSY) != 0) {
    237 				/* tell them to dump it when done */
    238 				pg->flags |= PG_RELEASED;
    239 				UVMHIST_LOG(maphist,
    240 				    "  anon 0x%x, page 0x%x: BUSY (released!)",
    241 				    anon, pg, 0, 0);
    242 				return;
    243 			}
    244 			pmap_page_protect(pg, VM_PROT_NONE);
    245 			uvm_lock_pageq();	/* lock out pagedaemon */
    246 			uvm_pagefree(pg);	/* bye bye */
    247 			uvm_unlock_pageq();	/* free the daemon */
    248 			UVMHIST_LOG(maphist,"anon 0x%x, page 0x%x: freed now!",
    249 			    anon, pg, 0, 0);
    250 		}
    251 	}
    252 
    253 	/*
    254 	 * free any swap resources.
    255 	 */
    256 	uvm_anon_dropswap(anon);
    257 
    258 	/*
    259 	 * now that we've stripped the data areas from the anon, free the anon
    260 	 * itself!
    261 	 */
    262 	simple_lock(&uvm.afreelock);
    263 	anon->u.an_nxt = uvm.afree;
    264 	uvm.afree = anon;
    265 	uvmexp.nfreeanon++;
    266 	simple_unlock(&uvm.afreelock);
    267 	UVMHIST_LOG(maphist,"<- done!",0,0,0,0);
    268 }
    269 
    270 /*
    271  * uvm_anon_dropswap:  release any swap resources from this anon.
    272  *
    273  * => anon must be locked or have a reference count of 0.
    274  */
    275 void
    276 uvm_anon_dropswap(anon)
    277 	struct vm_anon *anon;
    278 {
    279 	UVMHIST_FUNC("uvm_anon_dropswap"); UVMHIST_CALLED(maphist);
    280 
    281 	if (anon->an_swslot == 0)
    282 		return;
    283 
    284 	UVMHIST_LOG(maphist,"freeing swap for anon %p, paged to swslot 0x%x",
    285 		    anon, anon->an_swslot, 0, 0);
    286 	uvm_swap_free(anon->an_swslot, 1);
    287 	anon->an_swslot = 0;
    288 
    289 	if (anon->u.an_page == NULL) {
    290 		/* this page is no longer only in swap. */
    291 		simple_lock(&uvm.swap_data_lock);
    292 		uvmexp.swpgonly--;
    293 		simple_unlock(&uvm.swap_data_lock);
    294 	}
    295 }
    296 
    297 /*
    298  * uvm_anon_lockloanpg: given a locked anon, lock its resident page
    299  *
    300  * => anon is locked by caller
    301  * => on return: anon is locked
    302  *		 if there is a resident page:
    303  *			if it has a uobject, it is locked by us
    304  *			if it is ownerless, we take over as owner
    305  *		 we return the resident page (it can change during
    306  *		 this function)
    307  * => note that the only time an anon has an ownerless resident page
    308  *	is if the page was loaned from a uvm_object and the uvm_object
    309  *	disowned it
    310  * => this only needs to be called when you want to do an operation
    311  *	on an anon's resident page and that page has a non-zero loan
    312  *	count.
    313  */
    314 struct vm_page *
    315 uvm_anon_lockloanpg(anon)
    316 	struct vm_anon *anon;
    317 {
    318 	struct vm_page *pg;
    319 	boolean_t locked = FALSE;
    320 
    321 	LOCK_ASSERT(simple_lock_held(&anon->an_lock));
    322 
    323 	/*
    324 	 * loop while we have a resident page that has a non-zero loan count.
    325 	 * if we successfully get our lock, we will "break" the loop.
    326 	 * note that the test for pg->loan_count is not protected -- this
    327 	 * may produce false positive results.   note that a false positive
    328 	 * result may cause us to do more work than we need to, but it will
    329 	 * not produce an incorrect result.
    330 	 */
    331 
    332 	while (((pg = anon->u.an_page) != NULL) && pg->loan_count != 0) {
    333 
    334 		/*
    335 		 * quickly check to see if the page has an object before
    336 		 * bothering to lock the page queues.   this may also produce
    337 		 * a false positive result, but that's ok because we do a real
    338 		 * check after that.
    339 		 *
    340 		 * XXX: quick check -- worth it?   need volatile?
    341 		 */
    342 
    343 		if (pg->uobject) {
    344 
    345 			uvm_lock_pageq();
    346 			if (pg->uobject) {	/* the "real" check */
    347 				locked =
    348 				    simple_lock_try(&pg->uobject->vmobjlock);
    349 			} else {
    350 				/* object disowned before we got PQ lock */
    351 				locked = TRUE;
    352 			}
    353 			uvm_unlock_pageq();
    354 
    355 			/*
    356 			 * if we didn't get a lock (try lock failed), then we
    357 			 * toggle our anon lock and try again
    358 			 */
    359 
    360 			if (!locked) {
    361 				simple_unlock(&anon->an_lock);
    362 
    363 				/*
    364 				 * someone locking the object has a chance to
    365 				 * lock us right now
    366 				 */
    367 
    368 				simple_lock(&anon->an_lock);
    369 				continue;
    370 			}
    371 		}
    372 
    373 		/*
    374 		 * if page is un-owned [i.e. the object dropped its ownership],
    375 		 * then we can take over as owner!
    376 		 */
    377 
    378 		if (pg->uobject == NULL && (pg->pqflags & PQ_ANON) == 0) {
    379 			uvm_lock_pageq();
    380 			pg->pqflags |= PQ_ANON;		/* take ownership... */
    381 			pg->loan_count--;	/* ... and drop our loan */
    382 			uvm_unlock_pageq();
    383 		}
    384 
    385 		/*
    386 		 * we did it!   break the loop
    387 		 */
    388 
    389 		break;
    390 	}
    391 	return(pg);
    392 }
    393 
    394 
    395 
    396 /*
    397  * page in every anon that is paged out to a range of swslots.
    398  *
    399  * swap_syscall_lock should be held (protects anonblock_list).
    400  */
    401 
    402 boolean_t
    403 anon_swap_off(startslot, endslot)
    404 	int startslot, endslot;
    405 {
    406 	struct uvm_anonblock *anonblock;
    407 
    408 	for (anonblock = LIST_FIRST(&anonblock_list);
    409 	     anonblock != NULL;
    410 	     anonblock = LIST_NEXT(anonblock, list)) {
    411 		int i;
    412 
    413 		/*
    414 		 * loop thru all the anons in the anonblock,
    415 		 * paging in where needed.
    416 		 */
    417 
    418 		for (i = 0; i < anonblock->count; i++) {
    419 			struct vm_anon *anon = &anonblock->anons[i];
    420 			int slot;
    421 
    422 			/*
    423 			 * lock anon to work on it.
    424 			 */
    425 
    426 			simple_lock(&anon->an_lock);
    427 
    428 			/*
    429 			 * is this anon's swap slot in range?
    430 			 */
    431 
    432 			slot = anon->an_swslot;
    433 			if (slot >= startslot && slot < endslot) {
    434 				boolean_t rv;
    435 
    436 				/*
    437 				 * yup, page it in.
    438 				 */
    439 
    440 				/* locked: anon */
    441 				rv = anon_pagein(anon);
    442 				/* unlocked: anon */
    443 
    444 				if (rv) {
    445 					return rv;
    446 				}
    447 			} else {
    448 
    449 				/*
    450 				 * nope, unlock and proceed.
    451 				 */
    452 
    453 				simple_unlock(&anon->an_lock);
    454 			}
    455 		}
    456 	}
    457 	return FALSE;
    458 }
    459 
    460 
    461 /*
    462  * fetch an anon's page.
    463  *
    464  * => anon must be locked, and is unlocked upon return.
    465  * => returns TRUE if pagein was aborted due to lack of memory.
    466  */
    467 
    468 static boolean_t
    469 anon_pagein(anon)
    470 	struct vm_anon *anon;
    471 {
    472 	struct vm_page *pg;
    473 	struct uvm_object *uobj;
    474 	int rv;
    475 
    476 	/* locked: anon */
    477 	LOCK_ASSERT(simple_lock_held(&anon->an_lock));
    478 
    479 	rv = uvmfault_anonget(NULL, NULL, anon);
    480 
    481 	/*
    482 	 * if rv == VM_PAGER_OK, anon is still locked, else anon
    483 	 * is unlocked
    484 	 */
    485 
    486 	switch (rv) {
    487 	case VM_PAGER_OK:
    488 		break;
    489 
    490 	case VM_PAGER_ERROR:
    491 	case VM_PAGER_REFAULT:
    492 
    493 		/*
    494 		 * nothing more to do on errors.
    495 		 * VM_PAGER_REFAULT can only mean that the anon was freed,
    496 		 * so again there's nothing to do.
    497 		 */
    498 
    499 		return FALSE;
    500 
    501 	default:
    502 #ifdef DIAGNOSTIC
    503 		panic("anon_pagein: uvmfault_anonget -> %d", rv);
    504 #else
    505 		return FALSE;
    506 #endif
    507 	}
    508 
    509 	/*
    510 	 * ok, we've got the page now.
    511 	 * mark it as dirty, clear its swslot and un-busy it.
    512 	 */
    513 
    514 	pg = anon->u.an_page;
    515 	uobj = pg->uobject;
    516 	uvm_swap_free(anon->an_swslot, 1);
    517 	anon->an_swslot = 0;
    518 	pg->flags &= ~(PG_CLEAN);
    519 
    520 	/*
    521 	 * deactivate the page (to put it on a page queue)
    522 	 */
    523 
    524 	pmap_clear_reference(pg);
    525 	pmap_page_protect(pg, VM_PROT_NONE);
    526 	uvm_lock_pageq();
    527 	uvm_pagedeactivate(pg);
    528 	uvm_unlock_pageq();
    529 
    530 	/*
    531 	 * unlock the anon and we're done.
    532 	 */
    533 
    534 	simple_unlock(&anon->an_lock);
    535 	if (uobj) {
    536 		simple_unlock(&uobj->vmobjlock);
    537 	}
    538 	return FALSE;
    539 }
    540