pmap.h revision 1.15
1/* $NetBSD: pmap.h,v 1.15 2007/11/22 16:16:45 bouyer Exp $ */ 2 3/* 4 * 5 * Copyright (c) 1997 Charles D. Cranor and Washington University. 6 * All rights reserved. 7 * 8 * Redistribution and use in source and binary forms, with or without 9 * modification, are permitted provided that the following conditions 10 * are met: 11 * 1. Redistributions of source code must retain the above copyright 12 * notice, this list of conditions and the following disclaimer. 13 * 2. Redistributions in binary form must reproduce the above copyright 14 * notice, this list of conditions and the following disclaimer in the 15 * documentation and/or other materials provided with the distribution. 16 * 3. All advertising materials mentioning features or use of this software 17 * must display the following acknowledgment: 18 * This product includes software developed by Charles D. Cranor and 19 * Washington University. 20 * 4. The name of the author may not be used to endorse or promote products 21 * derived from this software without specific prior written permission. 22 * 23 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR 24 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES 25 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. 26 * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, 27 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT 28 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 29 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 30 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 31 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF 32 * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 33 */ 34 35/* 36 * Copyright (c) 2001 Wasabi Systems, Inc. 37 * All rights reserved. 38 * 39 * Written by Frank van der Linden for Wasabi Systems, Inc. 40 * 41 * Redistribution and use in source and binary forms, with or without 42 * modification, are permitted provided that the following conditions 43 * are met: 44 * 1. Redistributions of source code must retain the above copyright 45 * notice, this list of conditions and the following disclaimer. 46 * 2. Redistributions in binary form must reproduce the above copyright 47 * notice, this list of conditions and the following disclaimer in the 48 * documentation and/or other materials provided with the distribution. 49 * 3. All advertising materials mentioning features or use of this software 50 * must display the following acknowledgement: 51 * This product includes software developed for the NetBSD Project by 52 * Wasabi Systems, Inc. 53 * 4. The name of Wasabi Systems, Inc. may not be used to endorse 54 * or promote products derived from this software without specific prior 55 * written permission. 56 * 57 * THIS SOFTWARE IS PROVIDED BY WASABI SYSTEMS, INC. ``AS IS'' AND 58 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED 59 * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR 60 * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL WASABI SYSTEMS, INC 61 * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR 62 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF 63 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS 64 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN 65 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) 66 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE 67 * POSSIBILITY OF SUCH DAMAGE. 68 */ 69 70#ifndef _AMD64_PMAP_H_ 71#define _AMD64_PMAP_H_ 72 73#if defined(_KERNEL_OPT) 74#include "opt_xen.h" 75#endif 76 77#include <machine/pte.h> 78#include <machine/segments.h> 79#include <machine/atomic.h> 80#ifdef _KERNEL 81#include <machine/cpufunc.h> 82#endif 83 84#include <uvm/uvm_object.h> 85#ifdef XEN 86#include <xen/xenfunc.h> 87#include <xen/xenpmap.h> 88#endif /* XEN */ 89 90/* 91 * The x86_64 pmap module closely resembles the i386 one. It uses 92 * the same recursive entry scheme, and the same alternate area 93 * trick for accessing non-current pmaps. See the i386 pmap.h 94 * for a description. The obvious difference is that 3 extra 95 * levels of page table need to be dealt with. The level 1 page 96 * table pages are at: 97 * 98 * l1: 0x00007f8000000000 - 0x00007fffffffffff (39 bits, needs PML4 entry) 99 * 100 * The alternate space is at: 101 * 102 * l1: 0xffffff8000000000 - 0xffffffffffffffff (39 bits, needs PML4 entry) 103 * 104 * The rest is kept as physical pages in 3 UVM objects, and is 105 * temporarily mapped for virtual access when needed. 106 * 107 * Note that address space is signed, so the layout for 48 bits is: 108 * 109 * +---------------------------------+ 0xffffffffffffffff 110 * | | 111 * | alt.L1 table (PTE pages) | 112 * | | 113 * +---------------------------------+ 0xffffff8000000000 114 * ~ ~ 115 * | | 116 * | Kernel Space | 117 * | | 118 * | | 119 * +---------------------------------+ 0xffff800000000000 = 0x0000800000000000 120 * | | 121 * | alt.L1 table (PTE pages) | 122 * | | 123 * +---------------------------------+ 0x00007f8000000000 124 * ~ ~ 125 * | | 126 * | User Space | 127 * | | 128 * | | 129 * +---------------------------------+ 0x0000000000000000 130 * 131 * In other words, there is a 'VA hole' at 0x0000800000000000 - 132 * 0xffff800000000000 which will trap, just as on, for example, 133 * sparcv9. 134 * 135 * The unused space can be used if needed, but it adds a little more 136 * complexity to the calculations. 137 */ 138 139/* 140 * The first generation of Hammer processors can use 48 bits of 141 * virtual memory, and 40 bits of physical memory. This will be 142 * more for later generations. These defines can be changed to 143 * variable names containing the # of bits, extracted from an 144 * extended cpuid instruction (variables are harder to use during 145 * bootstrap, though) 146 */ 147#define VIRT_BITS 48 148#define PHYS_BITS 40 149 150/* 151 * Mask to get rid of the sign-extended part of addresses. 152 */ 153#define VA_SIGN_MASK 0xffff000000000000 154#define VA_SIGN_NEG(va) ((va) | VA_SIGN_MASK) 155/* 156 * XXXfvdl this one's not right. 157 */ 158#define VA_SIGN_POS(va) ((va) & ~VA_SIGN_MASK) 159 160#define L4_SLOT_PTE 255 161#ifndef XEN 162#define L4_SLOT_KERN 256 163#else 164/* Xen use slots 256-272, let's move farther */ 165#define L4_SLOT_KERN 320 166#endif 167#define L4_SLOT_KERNBASE 511 168#define L4_SLOT_APTE 510 169 170#define PDIR_SLOT_KERN L4_SLOT_KERN 171#define PDIR_SLOT_PTE L4_SLOT_PTE 172#define PDIR_SLOT_APTE L4_SLOT_APTE 173 174/* 175 * the following defines give the virtual addresses of various MMU 176 * data structures: 177 * PTE_BASE and APTE_BASE: the base VA of the linear PTE mappings 178 * PTD_BASE and APTD_BASE: the base VA of the recursive mapping of the PTD 179 * PDP_PDE and APDP_PDE: the VA of the PDE that points back to the PDP/APDP 180 * 181 */ 182 183#define PTE_BASE ((pt_entry_t *) (L4_SLOT_PTE * NBPD_L4)) 184#define APTE_BASE ((pt_entry_t *) (VA_SIGN_NEG((L4_SLOT_APTE * NBPD_L4)))) 185 186#define L1_BASE PTE_BASE 187#define AL1_BASE APTE_BASE 188 189#define L2_BASE ((pd_entry_t *)((char *)L1_BASE + L4_SLOT_PTE * NBPD_L3)) 190#define L3_BASE ((pd_entry_t *)((char *)L2_BASE + L4_SLOT_PTE * NBPD_L2)) 191#define L4_BASE ((pd_entry_t *)((char *)L3_BASE + L4_SLOT_PTE * NBPD_L1)) 192 193#define AL2_BASE ((pd_entry_t *)((char *)AL1_BASE + L4_SLOT_PTE * NBPD_L3)) 194#define AL3_BASE ((pd_entry_t *)((char *)AL2_BASE + L4_SLOT_PTE * NBPD_L2)) 195#define AL4_BASE ((pd_entry_t *)((char *)AL3_BASE + L4_SLOT_PTE * NBPD_L1)) 196 197#define PDP_PDE (L4_BASE + PDIR_SLOT_PTE) 198#define APDP_PDE (L4_BASE + PDIR_SLOT_APTE) 199 200#define PDP_BASE L4_BASE 201#define APDP_BASE AL4_BASE 202 203#define NKL4_MAX_ENTRIES (unsigned long)1 204#define NKL3_MAX_ENTRIES (unsigned long)(NKL4_MAX_ENTRIES * 512) 205#define NKL2_MAX_ENTRIES (unsigned long)(NKL3_MAX_ENTRIES * 512) 206#define NKL1_MAX_ENTRIES (unsigned long)(NKL2_MAX_ENTRIES * 512) 207 208#define NKL4_KIMG_ENTRIES 1 209#define NKL3_KIMG_ENTRIES 1 210#define NKL2_KIMG_ENTRIES 8 211 212/* 213 * Since kva space is below the kernel in its entirety, we start off 214 * with zero entries on each level. 215 */ 216#define NKL4_START_ENTRIES 0 217#define NKL3_START_ENTRIES 0 218#define NKL2_START_ENTRIES 0 219#define NKL1_START_ENTRIES 0 /* XXX */ 220 221#define NTOPLEVEL_PDES (PAGE_SIZE / (sizeof (pd_entry_t))) 222 223#define NPDPG (PAGE_SIZE / sizeof (pd_entry_t)) 224 225#define PTP_MASK_INITIALIZER { L1_FRAME, L2_FRAME, L3_FRAME, L4_FRAME } 226#define PTP_SHIFT_INITIALIZER { L1_SHIFT, L2_SHIFT, L3_SHIFT, L4_SHIFT } 227#define NKPTP_INITIALIZER { NKL1_START_ENTRIES, NKL2_START_ENTRIES, \ 228 NKL3_START_ENTRIES, NKL4_START_ENTRIES } 229#define NKPTPMAX_INITIALIZER { NKL1_MAX_ENTRIES, NKL2_MAX_ENTRIES, \ 230 NKL3_MAX_ENTRIES, NKL4_MAX_ENTRIES } 231#define NBPD_INITIALIZER { NBPD_L1, NBPD_L2, NBPD_L3, NBPD_L4 } 232#define PDES_INITIALIZER { L2_BASE, L3_BASE, L4_BASE } 233#define APDES_INITIALIZER { AL2_BASE, AL3_BASE, AL4_BASE } 234 235#define PTP_LEVELS 4 236 237/* 238 * PG_AVAIL usage: we make use of the ignored bits of the PTE 239 */ 240 241#define PG_W PG_AVAIL1 /* "wired" mapping */ 242#define PG_PVLIST PG_AVAIL2 /* mapping has entry on pvlist */ 243/* PG_AVAIL3 not used */ 244 245#define PG_X 0 /* XXX dummy */ 246 247/* 248 * Number of PTE's per cache line. 8 byte pte, 64-byte cache line 249 * Used to avoid false sharing of cache lines. 250 */ 251#define NPTECL 8 252 253#include <x86/pmap.h> 254 255#ifndef XEN 256#define pmap_pa2pte(a) (a) 257#define pmap_pte2pa(a) ((a) & PG_FRAME) 258#define pmap_pte_set(p, n) do { *(p) = (n); } while (0) 259#define pmap_pte_testset(p, n) x86_atomic_testset_u64(p, n) 260#define pmap_pte_setbits(p, b) x86_atomic_setbits_u64(p, b) 261#define pmap_pte_clearbits(p, b) x86_atomic_clearbits_u64(p, b) 262#define pmap_pte_flush() /* nothing */ 263#define pmap_cpu_has_pg_n() (1) 264#define pmap_cpu_has_invlpg (1) 265#else 266static __inline pt_entry_t 267pmap_pa2pte(paddr_t pa) 268{ 269 return (pt_entry_t)xpmap_ptom_masked(pa); 270} 271 272static __inline paddr_t 273pmap_pte2pa(pt_entry_t pte) 274{ 275 return xpmap_mtop_masked(pte & PG_FRAME); 276} 277static __inline void 278pmap_pte_set(pt_entry_t *pte, pt_entry_t npte) 279{ 280 int s = splvm(); 281 xpq_queue_pte_update((pt_entry_t *)xpmap_ptetomach(pte), npte); 282 splx(s); 283} 284 285static __inline pt_entry_t 286pmap_pte_testset(volatile pt_entry_t *pte, pt_entry_t npte) 287{ 288 int s = splvm(); 289 pt_entry_t opte = *pte; 290 xpq_queue_pte_update((pt_entry_t *)xpmap_ptetomach(__UNVOLATILE(pte)), 291 npte); 292 xpq_flush_queue(); 293 splx(s); 294 return opte; 295} 296 297static __inline void 298pmap_pte_setbits(volatile pt_entry_t *pte, pt_entry_t bits) 299{ 300 int s = splvm(); 301 xpq_queue_pte_update((pt_entry_t *)xpmap_ptetomach(__UNVOLATILE(pte)), 302 (*pte) | bits); 303 xpq_flush_queue(); 304 splx(s); 305} 306 307static __inline void 308pmap_pte_clearbits(volatile pt_entry_t *pte, pt_entry_t bits) 309{ 310 int s = splvm(); 311 xpq_queue_pte_update((pt_entry_t *)xpmap_ptetomach(__UNVOLATILE(pte)), 312 (*pte) & ~bits); 313 xpq_flush_queue(); 314 splx(s); 315} 316 317#define pmap_cpu_has_pg_n() (1) 318#define pmap_cpu_has_invlpg (1) 319static __inline void 320pmap_pte_flush(void) 321{ 322 int s = splvm(); 323 xpq_flush_queue(); 324 splx(s); 325} 326#endif 327 328void pmap_prealloc_lowmem_ptps(void); 329void pmap_changeprot_local(vaddr_t, vm_prot_t); 330 331#endif /* _AMD64_PMAP_H_ */ 332