uvm_page.h revision 1.73.2.11 1 /* $NetBSD: uvm_page.h,v 1.73.2.11 2012/05/23 10:08:20 yamt Exp $ */
2
3 /*
4 * Copyright (c) 1997 Charles D. Cranor and Washington University.
5 * Copyright (c) 1991, 1993, The Regents of the University of California.
6 *
7 * All rights reserved.
8 *
9 * This code is derived from software contributed to Berkeley by
10 * The Mach Operating System project at Carnegie-Mellon University.
11 *
12 * Redistribution and use in source and binary forms, with or without
13 * modification, are permitted provided that the following conditions
14 * are met:
15 * 1. Redistributions of source code must retain the above copyright
16 * notice, this list of conditions and the following disclaimer.
17 * 2. Redistributions in binary form must reproduce the above copyright
18 * notice, this list of conditions and the following disclaimer in the
19 * documentation and/or other materials provided with the distribution.
20 * 3. Neither the name of the University nor the names of its contributors
21 * may be used to endorse or promote products derived from this software
22 * without specific prior written permission.
23 *
24 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
25 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
26 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
27 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
28 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
29 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
30 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
31 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
32 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
33 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
34 * SUCH DAMAGE.
35 *
36 * @(#)vm_page.h 7.3 (Berkeley) 4/21/91
37 * from: Id: uvm_page.h,v 1.1.2.6 1998/02/04 02:31:42 chuck Exp
38 *
39 *
40 * Copyright (c) 1987, 1990 Carnegie-Mellon University.
41 * All rights reserved.
42 *
43 * Permission to use, copy, modify and distribute this software and
44 * its documentation is hereby granted, provided that both the copyright
45 * notice and this permission notice appear in all copies of the
46 * software, derivative works or modified versions, and any portions
47 * thereof, and that both notices appear in supporting documentation.
48 *
49 * CARNEGIE MELLON ALLOWS FREE USE OF THIS SOFTWARE IN ITS "AS IS"
50 * CONDITION. CARNEGIE MELLON DISCLAIMS ANY LIABILITY OF ANY KIND
51 * FOR ANY DAMAGES WHATSOEVER RESULTING FROM THE USE OF THIS SOFTWARE.
52 *
53 * Carnegie Mellon requests users of this software to return to
54 *
55 * Software Distribution Coordinator or Software.Distribution (at) CS.CMU.EDU
56 * School of Computer Science
57 * Carnegie Mellon University
58 * Pittsburgh PA 15213-3890
59 *
60 * any improvements or extensions that they make and grant Carnegie the
61 * rights to redistribute these changes.
62 */
63
64 #ifndef _UVM_UVM_PAGE_H_
65 #define _UVM_UVM_PAGE_H_
66
67 #include <uvm/uvm_extern.h>
68 #include <uvm/uvm_pglist.h>
69
70 /*
71 * Management of resident (logical) pages.
72 *
73 * Each resident page has a vm_page structure, indexed by page number.
74 * There are several lists in the structure:
75 *
76 * - A radix tree rooted with the containing object is used to
77 * quickly perform object+offset lookups.
78 * - An ordered list of pages due for pageout.
79 *
80 * In addition, the structure contains the object and offset to which
81 * this page belongs (for pageout) and sundry status bits.
82 *
83 * Note that the page structure has no lock of its own. The page is
84 * generally protected by its owner's lock (UVM object or amap/anon).
85 * It should be noted that UVM has to serialize pmap(9) operations on
86 * the managed pages, e.g. for pmap_enter() calls. Hence, the lock
87 * order is as follows:
88 *
89 * [vmpage-owner-lock] ->
90 * any pmap locks (e.g. PV hash lock)
91 *
92 * Since the kernel is always self-consistent, no serialization is
93 * required for unmanaged mappings, e.g. for pmap_kenter_pa() calls.
94 *
95 * Field markings and the corresponding locks:
96 *
97 * o: page owner's lock (UVM object or amap/anon)
98 * p: lock on the page queues
99 * o|p: either lock can be acquired
100 * o&p: both locks are required
101 * ?: locked by pmap or assumed page owner's lock
102 *
103 * UVM and pmap(9) may use uvm_page_locked_p() to assert whether the
104 * page owner's lock is acquired.
105 */
106
107 struct vm_page {
108 union {
109 TAILQ_ENTRY(vm_page) queue;
110 LIST_ENTRY(vm_page) list;
111 } pageq; /* p: queue info for FIFO
112 * queue or free list */
113
114 union {
115 struct {
116 struct vm_anon *o_anon; /* o,p: anon */
117 struct uvm_object *o_object; /* o,p: object */
118 } owner;
119 #define uanon u.owner.o_anon
120 #define uobject u.owner.o_object
121 LIST_ENTRY(vm_page) cpulist;
122 } u;
123 voff_t offset; /* o,p: offset into object */
124 uint16_t flags; /* o: object flags */
125 uint16_t loan_count; /* number of active loans
126 * o|p: for reading
127 * o&p: for modification */
128 uint16_t wire_count; /* p: wired down map refs */
129 uint16_t pqflags; /* p: page queue flags */
130 paddr_t phys_addr; /* physical address of page */
131
132 #ifdef __HAVE_VM_PAGE_MD
133 struct vm_page_md mdpage; /* ?: pmap-specific data */
134 #endif
135
136 #if defined(UVM_PAGE_TRKOWN)
137 /* debugging fields to track page ownership */
138 pid_t owner; /* proc that set PG_BUSY */
139 lwpid_t lowner; /* lwp that set PG_BUSY */
140 const char *owner_tag; /* why it was set busy */
141 #endif
142 };
143
144 /*
145 * Overview of UVM page flags.
146 *
147 * Locking notes:
148 *
149 * PG_, struct vm_page::flags => locked by the owner
150 * PQ_, struct vm_page::pqflags => locked by the page-queue lock
151 * PQ_FREE => additionally locked by free-queue lock
152 *
153 * Flag descriptions:
154 *
155 * PG_CLEAN:
156 * Page is known clean.
157 * The contents of the page is consistent with its backing store.
158 *
159 * PG_DIRTY:
160 * Page is known dirty.
161 * To avoid losing data, the contents of the page should be written
162 * back to the backing store before freeing the page.
163 *
164 * PG_BUSY:
165 * Page is long-term locked, usually because of I/O (transfer from the
166 * page memory to the backing store) is in progress. LWP attempting
167 * to access the page shall set PG_WANTED and wait.
168 *
169 * PG_WANTED:
170 * Indicates that the page, which is currently PG_BUSY, is wanted by
171 * some other LWP. The page owner (i.e. LWP which set PG_BUSY) is
172 * responsible to clear both flags and wake up any waiters once it has
173 * released the long-term lock (PG_BUSY).
174 *
175 * PG_PAGEOUT:
176 * Indicates that the page is being paged-out in preparation for
177 * being freed.
178 *
179 * PG_RELEASED:
180 * Indicates that the page, which is currently PG_BUSY, should be freed
181 * after the release of long-term lock. It is responsibility of the
182 * owning LWP (i.e. which set PG_BUSY) to do it.
183 *
184 * PG_FAKE:
185 * Page has been allocated, but not yet initialised. The flag is used
186 * to avoid overwriting of valid data, e.g. to prevent read from the
187 * backing store when in-core data is newer.
188 *
189 * PG_RDONLY:
190 * Indicates that the page must be mapped read-only.
191 *
192 * PG_ZERO:
193 * Indicates that the page has been pre-zeroed. This flag is only
194 * set when the page is not in the queues and is cleared when the
195 * page is placed on the free list.
196 *
197 * PG_TABLED:
198 * Indicates that the page is currently in the object's offset queue,
199 * and that it should be removed from it once the page is freed. Used
200 * diagnostic purposes.
201 */
202
203 /*
204 * if you want to renumber PG_CLEAN and PG_DIRTY, check __CTASSERTs in
205 * uvm_page_status.c first.
206 */
207
208 #define PG_CLEAN 0x0001 /* page is known clean */
209 #define PG_DIRTY 0x0002 /* page is known dirty */
210 #define PG_BUSY 0x0004 /* page is locked */
211 #define PG_WANTED 0x0008 /* someone is waiting for page */
212 #define PG_PAGEOUT 0x0010 /* page to be freed for pagedaemon */
213 #define PG_RELEASED 0x0020 /* page to be freed when unbusied */
214 #define PG_FAKE 0x0040 /* page is not yet initialized */
215 #define PG_RDONLY 0x0080 /* page must be mapped read-only */
216 #define PG_ZERO 0x0100 /* page is pre-zero'd */
217 #define PG_TABLED 0x0200 /* page is in VP table */
218
219 #define PG_PAGER1 0x1000 /* pager-specific flag */
220 #define PG_PAGER2 0x2000 /* pager-specific flag */
221
222 #define UVM_PGFLAGBITS \
223 "\20\1CLEAN\2DIRTY\3BUSY\4WANTED" \
224 "\5PAGEOUT\6RELEASED\7FAKE\10RDONLY" \
225 "\11ZERO\12TABLED" \
226 "\15PAGER1\16PAGER2"
227
228 #define PQ_FREE 0x0001 /* page is on free list */
229 #define PQ_ANON 0x0002 /* page is part of an anon, rather
230 than an uvm_object */
231 #define PQ_AOBJ 0x0004 /* page is part of an anonymous
232 uvm_object */
233 #define PQ_SWAPBACKED (PQ_ANON|PQ_AOBJ)
234 #define PQ_READAHEAD 0x0008 /* read-ahead but has not been "hit" yet */
235 #define PQ_FILE 0x0010 /* file backed (non-anonymous) */
236 #define PQ_STAT (PQ_ANON|PQ_AOBJ|PQ_FILE)
237
238 #define PQ_PRIVATE1 0x0100
239 #define PQ_PRIVATE2 0x0200
240 #define PQ_PRIVATE3 0x0400
241 #define PQ_PRIVATE4 0x0800
242 #define PQ_PRIVATE5 0x1000
243 #define PQ_PRIVATE6 0x2000
244 #define PQ_PRIVATE7 0x4000
245 #define PQ_PRIVATE8 0x8000
246
247 #define UVM_PQFLAGBITS \
248 "\20\1FREE\2ANON\3AOBJ\4READAHEAD\5FILE" \
249 "\11PRIVATE1\12PRIVATE2\13PRIVATE3\14PRIVATE4" \
250 "\15PRIVATE5\16PRIVATE6\17PRIVATE7\20PRIVATE8"
251
252 /*
253 * physical memory layout structure
254 *
255 * MD vmparam.h must #define:
256 * VM_PHYSEG_MAX = max number of physical memory segments we support
257 * (if this is "1" then we revert to a "contig" case)
258 * VM_PHYSSEG_STRAT: memory sort/search options (for VM_PHYSEG_MAX > 1)
259 * - VM_PSTRAT_RANDOM: linear search (random order)
260 * - VM_PSTRAT_BSEARCH: binary search (sorted by address)
261 * - VM_PSTRAT_BIGFIRST: linear search (sorted by largest segment first)
262 * - others?
263 * XXXCDC: eventually we should purge all left-over global variables...
264 */
265 #define VM_PSTRAT_RANDOM 1
266 #define VM_PSTRAT_BSEARCH 2
267 #define VM_PSTRAT_BIGFIRST 3
268
269 /*
270 * vm_physseg: describes one segment of physical memory
271 */
272 struct vm_physseg {
273 paddr_t start; /* PF# of first page in segment */
274 paddr_t end; /* (PF# of last page in segment) + 1 */
275 paddr_t avail_start; /* PF# of first free page in segment */
276 paddr_t avail_end; /* (PF# of last free page in segment) +1 */
277 struct vm_page *pgs; /* vm_page structures (from start) */
278 struct vm_page *lastpg; /* vm_page structure for end */
279 int free_list; /* which free list they belong on */
280 u_int start_hint; /* start looking for free pages here */
281 /* protected by uvm_fpageqlock */
282 #ifdef __HAVE_PMAP_PHYSSEG
283 struct pmap_physseg pmseg; /* pmap specific (MD) data */
284 #endif
285 };
286
287 #ifdef _KERNEL
288
289 /*
290 * globals
291 */
292
293 extern bool vm_page_zero_enable;
294
295 /*
296 * physical memory config is stored in vm_physmem.
297 */
298
299 #define VM_PHYSMEM_PTR(i) (&vm_physmem[i])
300 #define VM_PHYSMEM_PTR_SWAP(i, j) \
301 do { vm_physmem[(i)] = vm_physmem[(j)]; } while (0)
302
303 extern struct vm_physseg vm_physmem[VM_PHYSSEG_MAX];
304 extern int vm_nphysseg;
305
306 /*
307 * prototypes: the following prototypes define the interface to pages
308 */
309
310 void uvm_page_init(vaddr_t *, vaddr_t *);
311 #if defined(UVM_PAGE_TRKOWN)
312 void uvm_page_own(struct vm_page *, const char *);
313 #endif
314 #if !defined(PMAP_STEAL_MEMORY)
315 bool uvm_page_physget(paddr_t *);
316 #endif
317 void uvm_page_recolor(int);
318 void uvm_pageidlezero(void);
319
320 void uvm_pageactivate(struct vm_page *);
321 vaddr_t uvm_pageboot_alloc(vsize_t);
322 void uvm_pagecopy(struct vm_page *, struct vm_page *);
323 void uvm_pagedeactivate(struct vm_page *);
324 void uvm_pagedequeue(struct vm_page *);
325 void uvm_pageenqueue(struct vm_page *);
326 void uvm_pagefree(struct vm_page *);
327 void uvm_page_unbusy(struct vm_page **, int);
328 struct vm_page *uvm_pagelookup(struct uvm_object *, voff_t);
329 void uvm_pageunwire(struct vm_page *);
330 void uvm_pagewire(struct vm_page *);
331 void uvm_pagezero(struct vm_page *);
332 bool uvm_pageismanaged(paddr_t);
333 unsigned int uvm_pagegetdirty(struct vm_page *);
334 void uvm_pagemarkdirty(struct vm_page *, unsigned int);
335 bool uvm_pagecheckdirty(struct vm_page *, bool);
336 bool uvm_pagereadonly_p(struct vm_page *);
337 bool uvm_page_locked_p(struct vm_page *);
338 kmutex_t *uvm_page_getlock(struct vm_page *);
339 bool uvm_page_samelock_p(struct vm_page *, struct vm_page *);
340
341 struct uvm_cpu;
342 struct uvm_cpu *uvm_cpu_get(void);
343 void uvm_cpu_put(struct uvm_cpu *);
344
345 /*
346 * page dirtiness status for uvm_pagegetdirty and uvm_pagemarkdirty
347 *
348 * UNKNOWN means that we need to consult pmap to know if the page is
349 * dirty or not.
350 * basically, UVM_PAGE_STATUS_CLEAN implies that the page has no writable
351 * mapping.
352 *
353 * if you want to renumber these, check __CTASSERTs in
354 * uvm_page_status.c first.
355 */
356 #define UVM_PAGE_STATUS_UNKNOWN 0
357 #define UVM_PAGE_STATUS_CLEAN 1
358 #define UVM_PAGE_STATUS_DIRTY 2
359 #define UVM_PAGE_NUM_STATUS 3
360
361 int uvm_page_lookup_freelist(struct vm_page *);
362
363 int vm_physseg_find(paddr_t, int *);
364 struct vm_page *uvm_phys_to_vm_page(paddr_t);
365 paddr_t uvm_vm_page_to_phys(const struct vm_page *);
366
367 /*
368 * macros
369 */
370
371 #define VM_PAGE_TO_PHYS(entry) uvm_vm_page_to_phys(entry)
372
373 #ifdef __HAVE_VM_PAGE_MD
374 #define VM_PAGE_TO_MD(pg) (&(pg)->mdpage)
375 #endif
376
377 /*
378 * Compute the page color bucket for a given page.
379 */
380 #define VM_PGCOLOR_BUCKET(pg) \
381 (atop(VM_PAGE_TO_PHYS((pg))) & uvmexp.colormask)
382
383 #define PHYS_TO_VM_PAGE(pa) uvm_phys_to_vm_page(pa)
384
385 #define VM_PAGE_IS_FREE(entry) ((entry)->pqflags & PQ_FREE)
386 #define VM_FREE_PAGE_TO_CPU(pg) ((struct uvm_cpu *)((uintptr_t)pg->offset))
387
388 #ifdef DEBUG
389 void uvm_pagezerocheck(struct vm_page *);
390 #endif /* DEBUG */
391
392 #endif /* _KERNEL */
393
394 #endif /* _UVM_UVM_PAGE_H_ */
395