/*	$NetBSD: uvm_pager.c,v 1.107.2.2 2012/01/24 02:10:47 yamt Exp $	*/

/*
 * Copyright (c) 1997 Charles D. Cranor and Washington University.
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
 * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
 * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 *
 * from: Id: uvm_pager.c,v 1.1.2.23 1998/02/02 20:38:06 chuck Exp
 */

/*
 * uvm_pager.c: generic functions used to assist the pagers.
 */

#include <sys/cdefs.h>
__KERNEL_RCSID(0, "$NetBSD: uvm_pager.c,v 1.107.2.2 2012/01/24 02:10:47 yamt Exp $");

#include "opt_uvmhist.h"
#include "opt_readahead.h"
#include "opt_pagermap.h"

#include <sys/param.h>
#include <sys/systm.h>
#include <sys/vnode.h>
#include <sys/buf.h>

#include <uvm/uvm.h>

/*
 * XXX
 * this is needed until the device strategy interface
 * is changed to do physically-addressed i/o.
 */

#ifndef PAGER_MAP_DEFAULT_SIZE
#define PAGER_MAP_DEFAULT_SIZE	(16 * 1024 * 1024)
#endif

#ifndef PAGER_MAP_SIZE
#define PAGER_MAP_SIZE	PAGER_MAP_DEFAULT_SIZE
#endif

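/*
 * note (editor's sketch of the config plumbing): the default above may
 * be overridden from the kernel config via options PAGER_MAP_SIZE,
 * which is delivered through the opt_pagermap.h header included above.
 */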
size_t pager_map_size = PAGER_MAP_SIZE;

/*
 * list of uvm pagers in the system
 */

const struct uvm_pagerops * const uvmpagerops[] = {
	&aobj_pager,
	&uvm_deviceops,
	&uvm_vnodeops,
	&ubc_pager,
};

/*
 * the pager map: provides KVA for I/O
 */

struct vm_map *pager_map;		/* XXX */
kmutex_t pager_map_wanted_lock;
bool pager_map_wanted;	/* locked by pager map */
static vaddr_t emergva;
static int emerg_ncolors;
static bool emerginuse;

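/*
 * uvm_pager_realloc_emerg: allocate (or grow) the emergency KVA window
 * used by the pagedaemon when pager_map is full.  the window is large
 * enough for one MAXPHYS-sized, color-aligned mapping.  called at boot
 * and again if uvmexp.ncolors has grown since the last allocation.
 */
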
void
uvm_pager_realloc_emerg(void)
{
	vaddr_t new_emergva, old_emergva;
	int old_emerg_ncolors;

	if (__predict_true(emergva != 0 && emerg_ncolors >= uvmexp.ncolors))
		return;

	KASSERT(!emerginuse);

	new_emergva = uvm_km_alloc(kernel_map,
	    round_page(MAXPHYS) + ptoa(uvmexp.ncolors), ptoa(uvmexp.ncolors),
	    UVM_KMF_VAONLY);

	KASSERT(new_emergva != 0);

	old_emergva = emergva;
	old_emerg_ncolors = emerg_ncolors;

	/*
	 * re-coloring in late boot isn't supported anyway, so taking
	 * pager_map_wanted_lock here is not needed.
	 */
	if (0) /* XXX */
		mutex_enter(&pager_map_wanted_lock);

	emergva = new_emergva;
	emerg_ncolors = uvmexp.ncolors;
	wakeup(&old_emergva);

	if (0) /* XXX */
		mutex_exit(&pager_map_wanted_lock);

	if (old_emergva)
		uvm_km_free(kernel_map, old_emergva,
		    round_page(MAXPHYS) + ptoa(old_emerg_ncolors),
		    UVM_KMF_VAONLY);
}

/*
 * uvm_pager_init: init pagers (at boot time)
 */

void
uvm_pager_init(void)
{
	u_int lcv;
	vaddr_t sva, eva;

	/*
	 * init pager map
	 */

	sva = 0;
	pager_map = uvm_km_suballoc(kernel_map, &sva, &eva, pager_map_size, 0,
	    false, NULL);
	mutex_init(&pager_map_wanted_lock, MUTEX_DEFAULT, IPL_NONE);
	pager_map_wanted = false;

	uvm_pager_realloc_emerg();

	/*
	 * init ASYNC I/O queue
	 */

	TAILQ_INIT(&uvm.aio_done);

	/*
	 * call pager init functions
	 */
	for (lcv = 0; lcv < __arraycount(uvmpagerops); lcv++) {
		if (uvmpagerops[lcv]->pgo_init)
			uvmpagerops[lcv]->pgo_init();
	}
}

/*
 * uvm_pagermapin: map pages into KVA (pager_map) for I/O that needs mappings
 *
 * we basically just map in a blank map entry to reserve the space in the
 * map and then use pmap_kenter_pa() to put the mappings in by hand.
 */

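/*
 * a minimal usage sketch (editor's illustration, not from the original
 * source): a pager about to write out "npages" busy pages might do:
 *
 *	kva = uvm_pagermapin(pgs, npages, UVMPAGER_MAPIN_WAITOK);
 *	... start i/o on the buffer mapped at kva ...
 *	uvm_pagermapout(kva, npages);
 *
 * a read into the pages would also pass UVMPAGER_MAPIN_READ so that
 * the mapping is writable.
 */
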
vaddr_t
uvm_pagermapin(struct vm_page **pps, int npages, int flags)
{
	vsize_t size;
	vaddr_t kva;
	vaddr_t cva;
	struct vm_page *pp;
	vm_prot_t prot;
	const bool pdaemon = (curlwp == uvm.pagedaemon_lwp);
	const u_int first_color = VM_PGCOLOR_BUCKET(*pps);
	UVMHIST_FUNC("uvm_pagermapin"); UVMHIST_CALLED(maphist);

	UVMHIST_LOG(maphist,"(pps=0x%x, npages=%d, first_color=%u)",
		pps, npages, first_color, 0);

	/*
	 * compute protection.  outgoing I/O only needs read
	 * access to the page, whereas incoming needs read/write.
	 */

	prot = VM_PROT_READ;
	if (flags & UVMPAGER_MAPIN_READ)
		prot |= VM_PROT_WRITE;

ReStart:
	size = ptoa(npages);
	kva = 0;			/* let system choose VA */

	if (uvm_map(pager_map, &kva, size, NULL, UVM_UNKNOWN_OFFSET,
	    first_color, UVM_FLAG_COLORMATCH | UVM_FLAG_NOMERGE
	    | (pdaemon ? UVM_FLAG_NOWAIT : 0)) != 0) {
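		/*
		 * pager_map is full.  the pagedaemon must not sleep
		 * waiting for space (that could stall page reclaim),
		 * so it falls back to the preallocated emergency
		 * window instead.
		 */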
		if (pdaemon) {
			mutex_enter(&pager_map_wanted_lock);
			if (emerginuse) {
				UVM_UNLOCK_AND_WAIT(&emergva,
				    &pager_map_wanted_lock, false,
				    "emergva", 0);
				goto ReStart;
			}
			emerginuse = true;
			mutex_exit(&pager_map_wanted_lock);
			kva = emergva + ptoa(first_color);
			/* The shift implicitly truncates to PAGE_SIZE */
			KASSERT(npages <= (MAXPHYS >> PAGE_SHIFT));
			goto enter;
		}
		if ((flags & UVMPAGER_MAPIN_WAITOK) == 0) {
			UVMHIST_LOG(maphist,"<- NOWAIT failed", 0,0,0,0);
			return(0);
		}
		mutex_enter(&pager_map_wanted_lock);
		pager_map_wanted = true;
		UVMHIST_LOG(maphist, "  SLEEPING on pager_map",0,0,0,0);
		UVM_UNLOCK_AND_WAIT(pager_map, &pager_map_wanted_lock, false,
		    "pager_map", 0);
		goto ReStart;
	}

enter:
	/* got it */
	for (cva = kva; npages != 0; npages--, cva += PAGE_SIZE) {
		pp = *pps++;
		KASSERT(pp);
		// KASSERT(!((VM_PAGE_TO_PHYS(pp) ^ cva) & uvmexp.colormask));
		KASSERT(pp->flags & PG_BUSY);
		pmap_kenter_pa(cva, VM_PAGE_TO_PHYS(pp), prot, 0);
	}
	pmap_update(vm_map_pmap(pager_map));

	UVMHIST_LOG(maphist, "<- done (KVA=0x%x)", kva,0,0,0);
	return(kva);
}

/*
 * uvm_pagermapout: remove pager_map mapping
 *
 * we remove the pmap-level mappings by hand and then remove the map
 * entry (waking up anyone waiting for space).
 */

void
uvm_pagermapout(vaddr_t kva, int npages)
{
	vsize_t size = ptoa(npages);
	struct vm_map_entry *entries;
	UVMHIST_FUNC("uvm_pagermapout"); UVMHIST_CALLED(maphist);

	UVMHIST_LOG(maphist, " (kva=0x%x, npages=%d)", kva, npages,0,0);

	/*
	 * duplicate uvm_unmap, but add in pager_map_wanted handling.
	 */

	pmap_kremove(kva, size);
	pmap_update(pmap_kernel());

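	/*
	 * if the kva came from the emergency window (it lies within the
	 * color-aligned emergva block), there is no map entry to remove;
	 * just mark the window free and wake any waiter.
	 */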
	if ((kva & ~ptoa(uvmexp.colormask)) == emergva) {
		mutex_enter(&pager_map_wanted_lock);
		KASSERT(emerginuse);
		emerginuse = false;
		wakeup(&emergva);
		mutex_exit(&pager_map_wanted_lock);
		return;
	}

	vm_map_lock(pager_map);
	uvm_unmap_remove(pager_map, kva, kva + size, &entries, NULL, 0);
	mutex_enter(&pager_map_wanted_lock);
	if (pager_map_wanted) {
		pager_map_wanted = false;
		wakeup(pager_map);
	}
	mutex_exit(&pager_map_wanted_lock);
	vm_map_unlock(pager_map);
	if (entries)
		uvm_unmap_detach(entries, 0);
	UVMHIST_LOG(maphist,"<- done",0,0,0,0);
}

/*
 * interrupt-context iodone handler for single-buf i/os
 * or the top-level buf of a nested-buf i/o.
 */

void
uvm_aio_biodone(struct buf *bp)
{
	/* reset b_iodone for when this is a single-buf i/o. */
	bp->b_iodone = uvm_aio_aiodone;

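	/*
	 * defer the real completion work to the aiodone workqueue:
	 * it takes sleep locks and so must run in thread context.
	 */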
	workqueue_enqueue(uvm.aiodone_queue, &bp->b_work, NULL);
}

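/*
 * uvm_aio_aiodone_pages: finish i/o on a set of pages: handle any
 * error, unbusy or free the pages, and for swap-backed pages update
 * the swap-slot bookkeeping.  runs in thread context.
 */
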
void
uvm_aio_aiodone_pages(struct vm_page **pgs, int npages, bool write, int error)
{
	struct uvm_object *uobj;
	struct vm_page *pg;
	kmutex_t *slock;
	int pageout_done;	/* number of PG_PAGEOUT pages processed */
	int swslot;
	int i;
	bool swap;
	UVMHIST_FUNC("uvm_aio_aiodone_pages"); UVMHIST_CALLED(ubchist);

	swslot = 0;
	pageout_done = 0;
	slock = NULL;
	uobj = NULL;
	pg = pgs[0];
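	/*
	 * a page takes the swap path if it is an anon page or belongs
	 * to an aobj (aobj pages are flagged PQ_AOBJ); the first page
	 * decides the path for the whole batch.
	 */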
	swap = (pg->uanon != NULL && pg->uobject == NULL) ||
		(pg->pqflags & PQ_AOBJ) != 0;
	if (!swap) {
		uobj = pg->uobject;
		slock = uobj->vmobjlock;
		mutex_enter(slock);
		mutex_enter(&uvm_pageqlock);
	} else {
#if defined(VMSWAP)
		if (error) {
			if (pg->uobject != NULL) {
				swslot = uao_find_swslot(pg->uobject,
				    pg->offset >> PAGE_SHIFT);
			} else {
				KASSERT(pg->uanon != NULL);
				swslot = pg->uanon->an_swslot;
			}
			KASSERT(swslot);
		}
#else /* defined(VMSWAP) */
		panic("%s: swap", __func__);
#endif /* defined(VMSWAP) */
	}
	for (i = 0; i < npages; i++) {
#if defined(VMSWAP)
		bool anon_disposed = false; /* XXX gcc */
#endif /* defined(VMSWAP) */

		pg = pgs[i];
		KASSERT(swap || pg->uobject == uobj);
		UVMHIST_LOG(ubchist, "pg %p", pg, 0,0,0);

#if defined(VMSWAP)
		/*
		 * for swap i/os, lock each page's object (or anon)
		 * individually since each page may need a different lock.
		 */

		if (swap) {
			if (pg->uobject != NULL) {
				slock = pg->uobject->vmobjlock;
			} else {
				slock = pg->uanon->an_lock;
			}
			mutex_enter(slock);
			mutex_enter(&uvm_pageqlock);
			anon_disposed = (pg->flags & PG_RELEASED) != 0;
			KASSERT(!anon_disposed || pg->uobject != NULL ||
			    pg->uanon->an_ref == 0);
		}
#endif /* defined(VMSWAP) */

		/*
		 * process errors.  for reads, just mark the page to be freed.
		 * for writes, if the error was ENOMEM, we assume this was
		 * a transient failure so we mark the page dirty so that
		 * we'll try to write it again later.  for all other write
		 * errors, we assume the error is permanent, thus the data
		 * in the page is lost.  bummer.
		 */

		if (error) {
			int slot;
			if (!write) {
				pg->flags |= PG_RELEASED;
				continue;
			} else if (error == ENOMEM) {
				if (pg->flags & PG_PAGEOUT) {
					pg->flags &= ~PG_PAGEOUT;
					pageout_done++;
				}
				uvm_pagemarkdirty(pg, UVM_PAGE_STATUS_DIRTY);
				uvm_pageactivate(pg);
				slot = 0;
			} else
				slot = SWSLOT_BAD;

#if defined(VMSWAP)
			if (swap) {
				if (pg->uobject != NULL) {
					int oldslot;
					oldslot = uao_set_swslot(pg->uobject,
						pg->offset >> PAGE_SHIFT, slot);
					KASSERT(oldslot == swslot + i);
				} else {
					KASSERT(pg->uanon->an_swslot ==
						swslot + i);
					pg->uanon->an_swslot = slot;
				}
			}
#endif /* defined(VMSWAP) */
		}

		/*
		 * if the page is PG_FAKE, this must have been a read to
		 * initialize the page.  clear PG_FAKE and activate the page.
		 */

		if (pg->flags & PG_FAKE) {
			KASSERT(!write);
			pg->flags &= ~PG_FAKE;
#if defined(READAHEAD_STATS)
			pg->pqflags |= PQ_READAHEAD;
			uvm_ra_total.ev_count++;
#endif /* defined(READAHEAD_STATS) */
			KASSERT(uvm_pagegetdirty(pg) == UVM_PAGE_STATUS_CLEAN);
			uvm_pageenqueue(pg);
		}

		/*
		 * do accounting for pagedaemon i/o and arrange to free
		 * the pages instead of just unbusying them.
		 */

		if (pg->flags & PG_PAGEOUT) {
			pg->flags &= ~PG_PAGEOUT;
			pageout_done++;
			uvmexp.pdfreed++;
			pg->flags |= PG_RELEASED;
		}

#if defined(VMSWAP)
		/*
		 * for swap pages, unlock everything for this page now.
		 */

		if (swap) {
			if (pg->uobject == NULL && anon_disposed) {
				mutex_exit(&uvm_pageqlock);
				uvm_anon_release(pg->uanon);
			} else {
				uvm_page_unbusy(&pg, 1);
				mutex_exit(&uvm_pageqlock);
				mutex_exit(slock);
			}
		}
#endif /* defined(VMSWAP) */
	}
	uvm_pageout_done(pageout_done);
	if (!swap) {
		uvm_page_unbusy(pgs, npages);
		mutex_exit(&uvm_pageqlock);
		mutex_exit(slock);
	} else {
#if defined(VMSWAP)
		KASSERT(write);

		/* these pages are now only in swap. */
		mutex_enter(&uvm_swap_data_lock);
		KASSERT(uvmexp.swpgonly + npages <= uvmexp.swpginuse);
		if (error != ENOMEM)
			uvmexp.swpgonly += npages;
		mutex_exit(&uvm_swap_data_lock);
		if (error) {
			if (error != ENOMEM)
				uvm_swap_markbad(swslot, npages);
			else
				uvm_swap_free(swslot, npages);
		}
		uvmexp.pdpending--;
#endif /* defined(VMSWAP) */
	}
}

/*
 * uvm_aio_aiodone: do iodone processing for async i/os.
 * this should be called in thread context, not interrupt context.
 */

void
uvm_aio_aiodone(struct buf *bp)
{
	int npages = bp->b_bufsize >> PAGE_SHIFT;
	struct vm_page *pgs[npages];
	int i, error;
	bool write;
	UVMHIST_FUNC("uvm_aio_aiodone"); UVMHIST_CALLED(ubchist);
	UVMHIST_LOG(ubchist, "bp %p", bp, 0,0,0);

	error = bp->b_error;
	write = (bp->b_flags & B_READ) == 0;

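	/*
	 * recover the vm_page for each mapped page from the pager_map
	 * KVA before tearing the mapping down.
	 */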
	for (i = 0; i < npages; i++) {
		pgs[i] = uvm_pageratop((vaddr_t)bp->b_data + (i << PAGE_SHIFT));
		UVMHIST_LOG(ubchist, "pgs[%d] = %p", i, pgs[i],0,0);
	}
	uvm_pagermapout((vaddr_t)bp->b_data, npages);

	uvm_aio_aiodone_pages(pgs, npages, write, error);

	if (write && (bp->b_cflags & BC_AGE) != 0) {
		mutex_enter(bp->b_objlock);
		vwakeup(bp);
		mutex_exit(bp->b_objlock);
	}
	putiobuf(bp);
}

/*
 * uvm_pageratop: convert KVAs in the pager map back to their page
 * structures.
 */

struct vm_page *
uvm_pageratop(vaddr_t kva)
{
	struct vm_page *pg;
	paddr_t pa;
	bool rv;

	rv = pmap_extract(pmap_kernel(), kva, &pa);
	KASSERT(rv);
	pg = PHYS_TO_VM_PAGE(pa);
	KASSERT(pg != NULL);
	return (pg);
}