Home | History | Annotate | Line # | Download | only in include
pte.h revision 1.15.48.1
      1  1.15.48.1    joerg /*	$NetBSD: pte.h,v 1.15.48.1 2007/10/26 15:42:38 joerg Exp $	*/
      2  1.15.48.1    joerg 
      3  1.15.48.1    joerg /*
      4  1.15.48.1    joerg  * Copyright (c) 2001 Wasabi Systems, Inc.
      5  1.15.48.1    joerg  * All rights reserved.
      6  1.15.48.1    joerg  *
      7  1.15.48.1    joerg  * Written by Frank van der Linden for Wasabi Systems, Inc.
      8  1.15.48.1    joerg  *
      9  1.15.48.1    joerg  * Redistribution and use in source and binary forms, with or without
     10  1.15.48.1    joerg  * modification, are permitted provided that the following conditions
     11  1.15.48.1    joerg  * are met:
     12  1.15.48.1    joerg  * 1. Redistributions of source code must retain the above copyright
     13  1.15.48.1    joerg  *    notice, this list of conditions and the following disclaimer.
     14  1.15.48.1    joerg  * 2. Redistributions in binary form must reproduce the above copyright
     15  1.15.48.1    joerg  *    notice, this list of conditions and the following disclaimer in the
     16  1.15.48.1    joerg  *    documentation and/or other materials provided with the distribution.
     17  1.15.48.1    joerg  * 3. All advertising materials mentioning features or use of this software
     18  1.15.48.1    joerg  *    must display the following acknowledgement:
     19  1.15.48.1    joerg  *      This product includes software developed for the NetBSD Project by
     20  1.15.48.1    joerg  *      Wasabi Systems, Inc.
     21  1.15.48.1    joerg  * 4. The name of Wasabi Systems, Inc. may not be used to endorse
     22  1.15.48.1    joerg  *    or promote products derived from this software without specific prior
     23  1.15.48.1    joerg  *    written permission.
     24  1.15.48.1    joerg  *
     25  1.15.48.1    joerg  * THIS SOFTWARE IS PROVIDED BY WASABI SYSTEMS, INC. ``AS IS'' AND
     26  1.15.48.1    joerg  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     27  1.15.48.1    joerg  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     28  1.15.48.1    joerg  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL WASABI SYSTEMS, INC
     29  1.15.48.1    joerg  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     30  1.15.48.1    joerg  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     31  1.15.48.1    joerg  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     32  1.15.48.1    joerg  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     33  1.15.48.1    joerg  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     34  1.15.48.1    joerg  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     35  1.15.48.1    joerg  * POSSIBILITY OF SUCH DAMAGE.
     36  1.15.48.1    joerg  */
     37       1.11  thorpej 
     38       1.10      mrg /*
     39       1.10      mrg  *
     40       1.10      mrg  * Copyright (c) 1997 Charles D. Cranor and Washington University.
     41        1.1      cgd  * All rights reserved.
     42        1.1      cgd  *
     43        1.1      cgd  * Redistribution and use in source and binary forms, with or without
     44        1.1      cgd  * modification, are permitted provided that the following conditions
     45        1.1      cgd  * are met:
     46        1.1      cgd  * 1. Redistributions of source code must retain the above copyright
     47        1.1      cgd  *    notice, this list of conditions and the following disclaimer.
     48        1.1      cgd  * 2. Redistributions in binary form must reproduce the above copyright
     49        1.1      cgd  *    notice, this list of conditions and the following disclaimer in the
     50        1.1      cgd  *    documentation and/or other materials provided with the distribution.
     51        1.1      cgd  * 3. All advertising materials mentioning features or use of this software
     52       1.10      mrg  *    must display the following acknowledgment:
     53       1.10      mrg  *      This product includes software developed by Charles D. Cranor and
     54       1.10      mrg  *      Washington University.
     55       1.10      mrg  * 4. The name of the author may not be used to endorse or promote products
     56       1.10      mrg  *    derived from this software without specific prior written permission.
     57       1.10      mrg  *
     58       1.10      mrg  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
     59       1.10      mrg  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
     60       1.10      mrg  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
     61       1.10      mrg  * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
     62       1.10      mrg  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
     63       1.10      mrg  * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
     64       1.10      mrg  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
     65       1.10      mrg  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
     66       1.10      mrg  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
     67       1.10      mrg  * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
     68        1.1      cgd  */
     69        1.1      cgd 
     70        1.1      cgd /*
     71       1.10      mrg  * pte.h rewritten by chuck based on the jolitz version, plus random
     72       1.10      mrg  * info on the pentium and other processors found on the net.   the
     73       1.10      mrg  * goal of this rewrite is to provide enough documentation on the MMU
     74       1.10      mrg  * hardware that the reader will be able to understand it without having
     75       1.10      mrg  * to refer to a hardware manual.
     76        1.1      cgd  */
     77        1.1      cgd 
     78        1.3   andrew #ifndef _I386_PTE_H_
     79        1.3   andrew #define _I386_PTE_H_
     80        1.3   andrew 
     81       1.10      mrg /*
     82       1.10      mrg  * i386 MMU hardware structure:
     83       1.10      mrg  *
     84       1.10      mrg  * the i386 MMU is a two-level MMU which maps 4GB of virtual memory.
     85       1.10      mrg  * the pagesize is 4K (4096 [0x1000] bytes), although newer pentium
     86       1.10      mrg  * processors can support a 4MB pagesize as well.
     87       1.10      mrg  *
     88       1.10      mrg  * the first level table (segment table?) is called a "page directory"
     89       1.10      mrg  * and it contains 1024 page directory entries (PDEs).   each PDE is
     90       1.10      mrg  * 4 bytes (an int), so a PD fits in a single 4K page.   this page is
     91       1.10      mrg  * the page directory page (PDP).  each PDE in a PDP maps 4MB of space
     92       1.10      mrg  * (1024 * 4MB = 4GB).   a PDE contains the physical address of the
     93       1.10      mrg  * second level table: the page table.   or, if 4MB pages are being used,
     94       1.10      mrg  * then the PDE contains the PA of the 4MB page being mapped.
     95       1.10      mrg  *
     96       1.10      mrg  * a page table consists of 1024 page table entries (PTEs).  each PTE is
     97       1.10      mrg  * 4 bytes (an int), so a page table also fits in a single 4K page.  a
     98       1.10      mrg  * 4K page being used as a page table is called a page table page (PTP).
     99       1.10      mrg  * each PTE in a PTP maps one 4K page (1024 * 4K = 4MB).   a PTE contains
    100       1.10      mrg  * the physical address of the page it maps and some flag bits (described
    101       1.10      mrg  * below).
    102       1.10      mrg  *
    103       1.10      mrg  * the processor has a special register, "cr3", which points to the
    104       1.10      mrg  * PDP which is currently controlling the mappings of the virtual
    105       1.10      mrg  * address space.
    106       1.10      mrg  *
    107       1.10      mrg  * the following picture shows the translation process for a 4K page:
    108       1.10      mrg  *
    109       1.10      mrg  * %cr3 register [PA of PDP]
    110       1.10      mrg  *      |
    111       1.10      mrg  *      |
    112       1.10      mrg  *      |   bits <31-22> of VA         bits <21-12> of VA   bits <11-0>
    113       1.10      mrg  *      |   index the PDP (0 - 1023)   index the PTP        are the page offset
    114       1.10      mrg  *      |         |                           |                  |
    115       1.10      mrg  *      |         v                           |                  |
    116       1.10      mrg  *      +--->+----------+                     |                  |
    117       1.10      mrg  *           | PD Page  |   PA of             v                  |
    118       1.10      mrg  *           |          |---PTP-------->+------------+           |
    119       1.10      mrg  *           | 1024 PDE |               | page table |--PTE--+   |
    120       1.10      mrg  *           | entries  |               | (aka PTP)  |       |   |
    121       1.10      mrg  *           +----------+               | 1024 PTE   |       |   |
    122       1.10      mrg  *                                      | entries    |       |   |
    123       1.10      mrg  *                                      +------------+       |   |
    124       1.10      mrg  *                                                           |   |
    125       1.10      mrg  *                                                bits <31-12>   bits <11-0>
    126       1.10      mrg  *                                                p h y s i c a l  a d d r
    127       1.10      mrg  *
    128       1.10      mrg  * the i386 caches PTEs in a TLB.   it is important to flush out old
    129       1.10      mrg  * TLB mappings when making a change to a mapping.   writing to the
    130       1.10      mrg  * %cr3 will flush the entire TLB.    newer processors also have an
    131       1.10      mrg  * instruction that will invalidate the mapping of a single page (which
    132       1.10      mrg  * is useful if you are changing a single mapping because it preserves
    133       1.10      mrg  * all the other cached TLB entries).
    134       1.10      mrg  *
    135       1.10      mrg  * as shown above, bits 31-12 of the PTE contain the PA of the page being
    136       1.10      mrg  * mapped.   the rest of the PTE is defined as follows:
    137       1.10      mrg  *   bit#	name	use
    138       1.10      mrg  *   11		n/a	available for OS use, hardware ignores it
    139       1.10      mrg  *   10		n/a	available for OS use, hardware ignores it
    140       1.10      mrg  *   9		n/a	available for OS use, hardware ignores it
    141       1.10      mrg  *   8		G	global bit (see discussion below)
    142       1.10      mrg  *   7		PS	page size [for PDEs] (0=4k, 1=4M <if supported>)
    143       1.10      mrg  *   6		D	dirty (modified) page
    144       1.10      mrg  *   5		A	accessed (referenced) page
    145       1.10      mrg  *   4		PCD	cache disable
    146       1.10      mrg  *   3		PWT	page write-through (1=write-through caching, 0=write-back)
    147       1.10      mrg  *   2		U/S	user/supervisor bit (0=supervisor only, 1=both u&s)
    148       1.10      mrg  *   1		R/W	read/write bit (0=read only, 1=read-write)
    149       1.10      mrg  *   0		P	present (valid)
    150       1.10      mrg  *
    151       1.10      mrg  * notes:
    152       1.10      mrg  *  - on the i386 the R/W bit is ignored if processor is in supervisor
    153       1.10      mrg  *    state (bug!)
    154       1.10      mrg  *  - PS is only supported on newer processors
    155       1.10      mrg  *  - PTEs with the G bit are global in the sense that they are not
    156       1.10      mrg  *    flushed from the TLB when %cr3 is written (to flush, use the
    157       1.10      mrg  *    "flush single page" instruction).   this is only supported on
    158       1.10      mrg  *    newer processors.    this bit can be used to keep the kernel's
    159       1.10      mrg  *    TLB entries around while context switching.   since the kernel
    160       1.10      mrg  *    is mapped into all processes at the same place it does not make
    161       1.10      mrg  *    sense to flush these entries when switching from one process'
    162       1.10      mrg  *    pmap to another.
    163       1.10      mrg  */
    164       1.10      mrg 
    165       1.11  thorpej #if !defined(_LOCORE)
    166       1.10      mrg 
    167       1.10      mrg /*
    168       1.10      mrg  * here we define the data types for PDEs and PTEs (one 32-bit word each)
    169       1.10      mrg  */
    170       1.10      mrg 
    171       1.15    perry typedef uint32_t pd_entry_t;		/* page directory entry (PDE) */
    172       1.15    perry typedef uint32_t pt_entry_t;		/* page table entry (PTE) */
    173       1.10      mrg 
    174        1.1      cgd #endif /* !defined(_LOCORE) */
    175        1.1      cgd 
    176       1.10      mrg /*
    177       1.10      mrg  * now we define various constants for playing with virtual addresses
    178       1.10      mrg  */
    179       1.10      mrg 
    180  1.15.48.1    joerg #define L1_SHIFT	12	/* log2(NBPD_L1) */
    181  1.15.48.1    joerg #define	L2_SHIFT	22	/* log2(NBPD_L2) */
    182  1.15.48.1    joerg #define	NBPD_L1		(1ULL << L1_SHIFT) /* # bytes mapped by L1 ent (4K) */
    183  1.15.48.1    joerg #define	NBPD_L2		(1ULL << L2_SHIFT) /* # bytes mapped by L2 ent (4MB) */
    184  1.15.48.1    joerg 
    185  1.15.48.1    joerg #define L2_MASK		0xffc00000	/* VA bits <31-22>: index into the PDP */
    186  1.15.48.1    joerg #define L1_MASK		0x003ff000	/* VA bits <21-12>: index into the PTP */
    187  1.15.48.1    joerg 
    188  1.15.48.1    joerg #define L2_FRAME	(L2_MASK)		/* VA bits <31-22> */
    189  1.15.48.1    joerg #define L1_FRAME	(L2_FRAME|L1_MASK)	/* VA bits <31-12> (0xfffff000) */
    190        1.1      cgd 
    191       1.10      mrg /*
    192       1.10      mrg  * here we define the bits of the PDE/PTE, as described above:
    193       1.10      mrg  *
    194       1.10      mrg  * XXXCDC: need to rename these (PG_u == ugly).
    195       1.10      mrg  */
    196       1.10      mrg 
    197       1.10      mrg #define	PG_V		0x00000001	/* valid entry (P, bit 0) */
    198       1.10      mrg #define	PG_RO		0x00000000	/* read-only page (R/W bit clear) */
    199       1.10      mrg #define	PG_RW		0x00000002	/* read-write page (R/W, bit 1) */
    200       1.10      mrg #define	PG_u		0x00000004	/* user accessible page (U/S, bit 2) */
    201       1.14      chs #define	PG_PROT		0x00000806	/* all protection bits (PG_RW|PG_u|PG_AVAIL3) */
    202        1.4  mycroft #define	PG_N		0x00000018	/* non-cacheable (PCD|PWT, bits 4-3) */
    203        1.4  mycroft #define	PG_U		0x00000020	/* has been used (A, bit 5) */
    204        1.4  mycroft #define	PG_M		0x00000040	/* has been modified (D, bit 6) */
    205       1.10      mrg #define PG_PS		0x00000080	/* 4MB page size (PS, bit 7; PDEs only) */
    206       1.10      mrg #define PG_G		0x00000100	/* global, don't TLB flush (G, bit 8) */
    207       1.10      mrg #define PG_AVAIL1	0x00000200	/* ignored by hardware (bit 9) */
    208       1.10      mrg #define PG_AVAIL2	0x00000400	/* ignored by hardware (bit 10) */
    209       1.10      mrg #define PG_AVAIL3	0x00000800	/* ignored by hardware (bit 11) */
    210        1.4  mycroft #define	PG_FRAME	0xfffff000	/* page frame mask (bits 31-12) */
    211       1.12  thorpej 
    212       1.12  thorpej #define	PG_LGFRAME	0xffc00000	/* large (4MB) page frame mask (bits 31-22) */
    213        1.1      cgd 
    214       1.10      mrg /*
    215       1.10      mrg  * various short-hand protection codes
    216       1.10      mrg  */
    217       1.10      mrg 
    218       1.10      mrg #define	PG_KR		0x00000000	/* kernel read-only (same value as PG_RO) */
    219       1.10      mrg #define	PG_KW		0x00000002	/* kernel read-write (same value as PG_RW) */
    220  1.15.48.1    joerg #define	PG_NX		0		/* dummy: zero, so OR-ing it in changes nothing */
    221       1.10      mrg 
    222       1.10      mrg /*
    223       1.10      mrg  * page protection exception bits
    224       1.10      mrg  */
    225       1.10      mrg 
    226       1.10      mrg #define PGEX_P		0x01	/* set: protection violation; clear: no mapping */
    227       1.10      mrg #define PGEX_W		0x02	/* exception during a write cycle */
    228       1.10      mrg #define PGEX_U		0x04	/* exception while in user mode (upl) */
    229        1.3   andrew 
    230        1.3   andrew #endif /* _I386_PTE_H_ */
    231