booke_pmap.c revision 1.10 1 1.10 jym /* $NetBSD: booke_pmap.c,v 1.10 2011/09/27 01:02:35 jym Exp $ */
2 1.2 matt /*-
3 1.2 matt * Copyright (c) 2010, 2011 The NetBSD Foundation, Inc.
4 1.2 matt * All rights reserved.
5 1.2 matt *
6 1.2 matt * This code is derived from software contributed to The NetBSD Foundation
7 1.2 matt * by Raytheon BBN Technologies Corp and Defense Advanced Research Projects
8 1.2 matt * Agency and which was developed by Matt Thomas of 3am Software Foundry.
9 1.2 matt *
10 1.2 matt * This material is based upon work supported by the Defense Advanced Research
11 1.2 matt * Projects Agency and Space and Naval Warfare Systems Center, Pacific, under
12 1.2 matt * Contract No. N66001-09-C-2073.
13 1.2 matt * Approved for Public Release, Distribution Unlimited
14 1.2 matt *
15 1.2 matt * Redistribution and use in source and binary forms, with or without
16 1.2 matt * modification, are permitted provided that the following conditions
17 1.2 matt * are met:
18 1.2 matt * 1. Redistributions of source code must retain the above copyright
19 1.2 matt * notice, this list of conditions and the following disclaimer.
20 1.2 matt * 2. Redistributions in binary form must reproduce the above copyright
21 1.2 matt * notice, this list of conditions and the following disclaimer in the
22 1.2 matt * documentation and/or other materials provided with the distribution.
23 1.2 matt *
24 1.2 matt * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
25 1.2 matt * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
26 1.2 matt * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
27 1.2 matt * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
28 1.2 matt * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
29 1.2 matt * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
30 1.2 matt * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
31 1.2 matt * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
32 1.2 matt * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
33 1.2 matt * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
34 1.2 matt * POSSIBILITY OF SUCH DAMAGE.
35 1.2 matt */
36 1.2 matt
37 1.4 matt #define __PMAP_PRIVATE
38 1.3 matt
39 1.2 matt #include <sys/cdefs.h>
40 1.2 matt
41 1.10 jym __KERNEL_RCSID(0, "$NetBSD: booke_pmap.c,v 1.10 2011/09/27 01:02:35 jym Exp $");
42 1.2 matt
43 1.2 matt #include <sys/param.h>
44 1.2 matt #include <sys/kcore.h>
45 1.2 matt #include <sys/buf.h>
46 1.2 matt
47 1.6 matt #include <uvm/uvm.h>
48 1.2 matt
49 1.2 matt #include <machine/pmap.h>
50 1.2 matt
51 1.2 matt /*
52 1.2 matt * Initialize the kernel pmap.
53 1.2 matt */
54 1.2 matt #ifdef MULTIPROCESSOR
55 1.2 matt #define PMAP_SIZE offsetof(struct pmap, pm_pai[MAXCPUS])
56 1.2 matt #else
57 1.2 matt #define PMAP_SIZE sizeof(struct pmap)
58 1.2 matt #endif
59 1.2 matt
60 1.2 matt CTASSERT(sizeof(struct pmap_segtab) == NBPG);
61 1.2 matt
62 1.2 matt void
63 1.2 matt pmap_procwr(struct proc *p, vaddr_t va, size_t len)
64 1.2 matt {
65 1.2 matt struct pmap * const pmap = p->p_vmspace->vm_map.pmap;
66 1.2 matt vsize_t off = va & PAGE_SIZE;
67 1.2 matt
68 1.2 matt kpreempt_disable();
69 1.2 matt for (const vaddr_t eva = va + len; va < eva; off = 0) {
70 1.2 matt const vaddr_t segeva = min(va + len, va - off + PAGE_SIZE);
71 1.2 matt pt_entry_t * const ptep = pmap_pte_lookup(pmap, va);
72 1.2 matt if (ptep == NULL) {
73 1.2 matt va = segeva;
74 1.2 matt continue;
75 1.2 matt }
76 1.2 matt pt_entry_t pt_entry = *ptep;
77 1.2 matt if (!pte_valid_p(pt_entry) || !pte_exec_p(pt_entry)) {
78 1.2 matt va = segeva;
79 1.2 matt continue;
80 1.2 matt }
81 1.2 matt kpreempt_enable();
82 1.2 matt dcache_wb(pte_to_paddr(pt_entry), segeva - va);
83 1.2 matt icache_inv(pte_to_paddr(pt_entry), segeva - va);
84 1.2 matt kpreempt_disable();
85 1.2 matt va = segeva;
86 1.2 matt }
87 1.2 matt kpreempt_enable();
88 1.2 matt }
89 1.2 matt
90 1.2 matt void
91 1.4 matt pmap_md_page_syncicache(struct vm_page *pg, __cpuset_t onproc)
92 1.2 matt {
93 1.4 matt /*
94 1.4 matt * If onproc is empty, we could do a
95 1.4 matt * pmap_page_protect(pg, VM_PROT_NONE) and remove all
96 1.4 matt * mappings of the page and clear its execness. Then
97 1.4 matt * the next time page is faulted, it will get icache
98 1.4 matt * synched. But this is easier. :)
99 1.4 matt */
100 1.2 matt paddr_t pa = VM_PAGE_TO_PHYS(pg);
101 1.2 matt dcache_wb_page(pa);
102 1.2 matt icache_inv_page(pa);
103 1.2 matt }
104 1.2 matt
105 1.2 matt vaddr_t
106 1.2 matt pmap_md_direct_map_paddr(paddr_t pa)
107 1.2 matt {
108 1.2 matt return (vaddr_t) pa;
109 1.2 matt }
110 1.2 matt
111 1.2 matt bool
112 1.2 matt pmap_md_direct_mapped_vaddr_p(vaddr_t va)
113 1.2 matt {
114 1.2 matt return va < VM_MIN_KERNEL_ADDRESS || VM_MAX_KERNEL_ADDRESS <= va;
115 1.2 matt }
116 1.2 matt
117 1.2 matt paddr_t
118 1.2 matt pmap_md_direct_mapped_vaddr_to_paddr(vaddr_t va)
119 1.2 matt {
120 1.2 matt return (paddr_t) va;
121 1.2 matt }
122 1.2 matt
123 1.2 matt /*
124 1.2 matt * Bootstrap the system enough to run with virtual memory.
125 1.2 matt * firstaddr is the first unused kseg0 address (not page aligned).
126 1.2 matt */
127 1.2 matt void
128 1.2 matt pmap_bootstrap(vaddr_t startkernel, vaddr_t endkernel,
129 1.2 matt const phys_ram_seg_t *avail, size_t cnt)
130 1.2 matt {
131 1.2 matt for (size_t i = 0; i < cnt; i++) {
132 1.2 matt printf(" uvm_page_physload(%#lx,%#lx,%#lx,%#lx,%d)",
133 1.2 matt atop(avail[i].start),
134 1.2 matt atop(avail[i].start + avail[i].size) - 1,
135 1.2 matt atop(avail[i].start),
136 1.2 matt atop(avail[i].start + avail[i].size) - 1,
137 1.2 matt VM_FREELIST_DEFAULT);
138 1.2 matt uvm_page_physload(
139 1.2 matt atop(avail[i].start),
140 1.2 matt atop(avail[i].start + avail[i].size) - 1,
141 1.2 matt atop(avail[i].start),
142 1.2 matt atop(avail[i].start + avail[i].size) - 1,
143 1.2 matt VM_FREELIST_DEFAULT);
144 1.2 matt }
145 1.2 matt
146 1.2 matt pmap_tlb_info_init(&pmap_tlb0_info); /* init the lock */
147 1.2 matt
148 1.2 matt /*
149 1.2 matt * Compute the number of pages kmem_map will have.
150 1.2 matt */
151 1.2 matt kmeminit_nkmempages();
152 1.2 matt
153 1.2 matt /*
154 1.2 matt * Figure out how many PTE's are necessary to map the kernel.
155 1.2 matt * We also reserve space for kmem_alloc_pageable() for vm_fork().
156 1.2 matt */
157 1.2 matt
158 1.2 matt /* Get size of buffer cache and set an upper limit */
159 1.2 matt buf_setvalimit((VM_MAX_KERNEL_ADDRESS - VM_MIN_KERNEL_ADDRESS) / 8);
160 1.2 matt vsize_t bufsz = buf_memcalc();
161 1.2 matt buf_setvalimit(bufsz);
162 1.2 matt
163 1.2 matt vsize_t nsegtabs = pmap_round_seg(VM_PHYS_SIZE
164 1.2 matt + (ubc_nwins << ubc_winshift)
165 1.2 matt + bufsz
166 1.2 matt + 16 * NCARGS
167 1.2 matt + pager_map_size
168 1.2 matt + maxproc * USPACE
169 1.2 matt #ifdef SYSVSHM
170 1.2 matt + NBPG * shminfo.shmall
171 1.2 matt #endif
172 1.2 matt + NBPG * nkmempages);
173 1.2 matt
174 1.2 matt /*
175 1.2 matt * Initialize `FYI' variables. Note we're relying on
176 1.2 matt * the fact that BSEARCH sorts the vm_physmem[] array
177 1.2 matt * for us. Must do this before uvm_pageboot_alloc()
178 1.2 matt * can be called.
179 1.2 matt */
180 1.2 matt pmap_limits.avail_start = vm_physmem[0].start << PGSHIFT;
181 1.2 matt pmap_limits.avail_end = vm_physmem[vm_nphysseg - 1].end << PGSHIFT;
182 1.2 matt const vsize_t max_nsegtabs =
183 1.2 matt (pmap_round_seg(VM_MAX_KERNEL_ADDRESS)
184 1.2 matt - pmap_trunc_seg(VM_MIN_KERNEL_ADDRESS)) / NBSEG;
185 1.2 matt if (nsegtabs >= max_nsegtabs) {
186 1.2 matt pmap_limits.virtual_end = VM_MAX_KERNEL_ADDRESS;
187 1.2 matt nsegtabs = max_nsegtabs;
188 1.2 matt } else {
189 1.2 matt pmap_limits.virtual_end = VM_MIN_KERNEL_ADDRESS
190 1.2 matt + nsegtabs * NBSEG;
191 1.2 matt }
192 1.2 matt
193 1.2 matt pmap_pvlist_lock_init(curcpu()->ci_ci.dcache_line_size);
194 1.2 matt
195 1.2 matt /*
196 1.2 matt * Now actually allocate the kernel PTE array (must be done
197 1.2 matt * after virtual_end is initialized).
198 1.2 matt */
199 1.2 matt vaddr_t segtabs =
200 1.2 matt uvm_pageboot_alloc(NBPG * nsegtabs + sizeof(struct pmap_segtab));
201 1.2 matt
202 1.2 matt /*
203 1.2 matt * Initialize the kernel's two-level page level. This only wastes
204 1.2 matt * an extra page for the segment table and allows the user/kernel
205 1.2 matt * access to be common.
206 1.2 matt */
207 1.2 matt struct pmap_segtab * const stp = (void *)segtabs;
208 1.2 matt segtabs += round_page(sizeof(struct pmap_segtab));
209 1.2 matt pt_entry_t **ptp = &stp->seg_tab[VM_MIN_KERNEL_ADDRESS >> SEGSHIFT];
210 1.2 matt for (u_int i = 0; i < nsegtabs; i++, segtabs += NBPG) {
211 1.2 matt *ptp++ = (void *)segtabs;
212 1.2 matt }
213 1.2 matt pmap_kernel()->pm_segtab = stp;
214 1.2 matt curcpu()->ci_pmap_kern_segtab = stp;
215 1.2 matt printf(" kern_segtab=%p", stp);
216 1.2 matt
217 1.2 matt #if 0
218 1.2 matt nsegtabs = (physmem + NPTEPG - 1) / NPTEPG;
219 1.2 matt segtabs = uvm_pageboot_alloc(NBPG * nsegtabs);
220 1.2 matt ptp = stp->seg_tab;
221 1.2 matt pt_entry_t pt_entry = PTE_M|PTE_xX|PTE_xR;
222 1.2 matt pt_entry_t *ptep = (void *)segtabs;
223 1.2 matt printf("%s: allocated %lu page table pages for mapping %u pages\n",
224 1.2 matt __func__, nsegtabs, physmem);
225 1.2 matt for (u_int i = 0; i < nsegtabs; i++, segtabs += NBPG, ptp++) {
226 1.2 matt *ptp = ptep;
227 1.2 matt for (u_int j = 0; j < NPTEPG; j++, ptep++) {
228 1.2 matt *ptep = pt_entry;
229 1.2 matt pt_entry += NBPG;
230 1.2 matt }
231 1.2 matt printf(" [%u]=%p (%#x)", i, *ptp, **ptp);
232 1.2 matt pt_entry |= PTE_xW;
233 1.2 matt pt_entry &= ~PTE_xX;
234 1.2 matt }
235 1.2 matt
236 1.2 matt /*
237 1.2 matt * Now make everything before the kernel inaccessible.
238 1.2 matt */
239 1.2 matt for (u_int i = 0; i < startkernel / NBPG; i += NBPG) {
240 1.2 matt stp->seg_tab[i >> SEGSHIFT][(i & SEGOFSET) >> PAGE_SHIFT] = 0;
241 1.2 matt }
242 1.2 matt #endif
243 1.2 matt
244 1.2 matt /*
245 1.2 matt * Initialize the pools.
246 1.2 matt */
247 1.2 matt pool_init(&pmap_pmap_pool, PMAP_SIZE, 0, 0, 0, "pmappl",
248 1.2 matt &pool_allocator_nointr, IPL_NONE);
249 1.2 matt pool_init(&pmap_pv_pool, sizeof(struct pv_entry), 0, 0, 0, "pvpl",
250 1.2 matt &pmap_pv_page_allocator, IPL_NONE);
251 1.2 matt
252 1.2 matt tlb_set_asid(0);
253 1.2 matt }
254 1.2 matt
255 1.2 matt struct vm_page *
256 1.2 matt pmap_md_alloc_poolpage(int flags)
257 1.2 matt {
258 1.2 matt /*
259 1.2 matt * Any managed page works for us.
260 1.2 matt */
261 1.2 matt return uvm_pagealloc(NULL, 0, NULL, flags);
262 1.2 matt }
263 1.2 matt
264 1.2 matt void
265 1.2 matt pmap_zero_page(paddr_t pa)
266 1.2 matt {
267 1.2 matt dcache_zero_page(pa);
268 1.5 matt
269 1.6 matt KASSERT(!VM_PAGEMD_EXECPAGE_P(VM_PAGE_TO_MD(PHYS_TO_VM_PAGE(pa))));
270 1.2 matt }
271 1.2 matt
272 1.2 matt void
273 1.2 matt pmap_copy_page(paddr_t src, paddr_t dst)
274 1.2 matt {
275 1.2 matt const size_t line_size = curcpu()->ci_ci.dcache_line_size;
276 1.2 matt const paddr_t end = src + PAGE_SIZE;
277 1.2 matt
278 1.2 matt while (src < end) {
279 1.2 matt __asm(
280 1.2 matt "dcbt %2,%1" "\n\t" /* touch next src cachline */
281 1.2 matt "dcba 0,%1" "\n\t" /* don't fetch dst cacheline */
282 1.2 matt :: "b"(src), "b"(dst), "b"(line_size));
283 1.2 matt for (u_int i = 0;
284 1.2 matt i < line_size;
285 1.2 matt src += 32, dst += 32, i += 32) {
286 1.2 matt __asm(
287 1.2 matt "lmw 24,0(%0)" "\n\t"
288 1.2 matt "stmw 24,0(%1)"
289 1.2 matt :: "b"(src), "b"(dst)
290 1.2 matt : "r24", "r25", "r26", "r27",
291 1.2 matt "r28", "r29", "r30", "r31");
292 1.2 matt }
293 1.2 matt }
294 1.5 matt
295 1.6 matt KASSERT(!VM_PAGEMD_EXECPAGE_P(VM_PAGE_TO_MD(PHYS_TO_VM_PAGE(dst - PAGE_SIZE))));
296 1.2 matt }
297 1.2 matt
298 1.2 matt void
299 1.2 matt pmap_md_init(void)
300 1.2 matt {
301 1.2 matt
302 1.2 matt /* nothing for now */
303 1.2 matt }
304 1.2 matt
305 1.2 matt bool
306 1.2 matt pmap_md_io_vaddr_p(vaddr_t va)
307 1.2 matt {
308 1.2 matt return va >= pmap_limits.avail_end
309 1.2 matt && !(VM_MIN_KERNEL_ADDRESS <= va && va < VM_MAX_KERNEL_ADDRESS);
310 1.2 matt }
311 1.2 matt
312 1.7 matt bool
313 1.7 matt pmap_md_tlb_check_entry(void *ctx, vaddr_t va, tlb_asid_t asid, pt_entry_t pte)
314 1.7 matt {
315 1.7 matt pmap_t pm = ctx;
316 1.7 matt struct pmap_asid_info * const pai = PMAP_PAI(pm, curcpu()->ci_tlb_info);
317 1.7 matt
318 1.7 matt if (asid != pai->pai_asid)
319 1.7 matt return true;
320 1.7 matt
321 1.7 matt const pt_entry_t * const ptep = pmap_pte_lookup(pm, va);
322 1.7 matt KASSERT(ptep != NULL);
323 1.7 matt pt_entry_t xpte = *ptep;
324 1.7 matt xpte &= ~((xpte & (PTE_UNSYNCED|PTE_UNMODIFIED)) << 1);
325 1.7 matt xpte ^= xpte & (PTE_UNSYNCED|PTE_UNMODIFIED|PTE_WIRED);
326 1.7 matt
327 1.7 matt KASSERTMSG(pte == xpte,
328 1.10 jym "pm=%p va=%#"PRIxVADDR" asid=%u: TLB pte (%#x) != real pte (%#x/%#x)",
329 1.10 jym pm, va, asid, pte, xpte, *ptep);
330 1.7 matt
331 1.7 matt return true;
332 1.7 matt }
333 1.8 matt
334 1.8 matt #ifdef MULTIPROCESSOR
335 1.8 matt void
336 1.8 matt pmap_md_tlb_info_attach(struct pmap_tlb_info *ti, struct cpu_info *ci)
337 1.8 matt {
338 1.8 matt /* nothing */
339 1.8 matt }
340 1.8 matt #endif /* MULTIPROCESSOR */
341