uvm_device.c revision 1.73 1 1.73 riastrad /* $NetBSD: uvm_device.c,v 1.73 2022/03/28 12:39:18 riastradh Exp $ */
2 1.4 mrg
3 1.1 mrg /*
4 1.1 mrg * Copyright (c) 1997 Charles D. Cranor and Washington University.
5 1.1 mrg * All rights reserved.
6 1.1 mrg *
7 1.1 mrg * Redistribution and use in source and binary forms, with or without
8 1.1 mrg * modification, are permitted provided that the following conditions
9 1.1 mrg * are met:
10 1.1 mrg * 1. Redistributions of source code must retain the above copyright
11 1.1 mrg * notice, this list of conditions and the following disclaimer.
12 1.1 mrg * 2. Redistributions in binary form must reproduce the above copyright
13 1.1 mrg * notice, this list of conditions and the following disclaimer in the
14 1.1 mrg * documentation and/or other materials provided with the distribution.
15 1.1 mrg *
16 1.1 mrg * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
17 1.1 mrg * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
18 1.1 mrg * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
19 1.1 mrg * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
20 1.1 mrg * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
21 1.1 mrg * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
22 1.1 mrg * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
23 1.1 mrg * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
24 1.1 mrg * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
25 1.1 mrg * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
26 1.4 mrg *
27 1.4 mrg * from: Id: uvm_device.c,v 1.1.2.9 1998/02/06 05:11:47 chs Exp
28 1.1 mrg */
29 1.1 mrg
30 1.1 mrg /*
31 1.1 mrg * uvm_device.c: the device pager.
32 1.1 mrg */
33 1.39 lukem
34 1.39 lukem #include <sys/cdefs.h>
35 1.73 riastrad __KERNEL_RCSID(0, "$NetBSD: uvm_device.c,v 1.73 2022/03/28 12:39:18 riastradh Exp $");
36 1.39 lukem
37 1.39 lukem #include "opt_uvmhist.h"
38 1.1 mrg
39 1.1 mrg #include <sys/param.h>
40 1.1 mrg #include <sys/systm.h>
41 1.1 mrg #include <sys/conf.h>
42 1.1 mrg #include <sys/proc.h>
43 1.63 para #include <sys/kmem.h>
44 1.1 mrg
45 1.1 mrg #include <uvm/uvm.h>
46 1.1 mrg #include <uvm/uvm_device.h>
47 1.60 jmcneill #include <uvm/uvm_pmap.h>
48 1.1 mrg
49 1.1 mrg /*
50 1.1 mrg * private global data structure
51 1.1 mrg *
52 1.1 mrg * we keep a list of active device objects in the system.
53 1.1 mrg */
54 1.1 mrg
55 1.1 mrg LIST_HEAD(udv_list_struct, uvm_device);
56 1.1 mrg static struct udv_list_struct udv_list;
57 1.67 ad static kmutex_t udv_lock __cacheline_aligned;
58 1.1 mrg
59 1.1 mrg /*
60 1.1 mrg * functions
61 1.1 mrg */
62 1.1 mrg
63 1.42 junyoung static void udv_init(void);
64 1.42 junyoung static void udv_reference(struct uvm_object *);
65 1.42 junyoung static void udv_detach(struct uvm_object *);
66 1.42 junyoung static int udv_fault(struct uvm_faultinfo *, vaddr_t,
67 1.47 drochner struct vm_page **, int, int, vm_prot_t,
68 1.45 thorpej int);
69 1.1 mrg
70 1.1 mrg /*
71 1.1 mrg * master pager structure
72 1.1 mrg */
73 1.1 mrg
74 1.51 yamt const struct uvm_pagerops uvm_deviceops = {
75 1.48 christos .pgo_init = udv_init,
76 1.48 christos .pgo_reference = udv_reference,
77 1.48 christos .pgo_detach = udv_detach,
78 1.48 christos .pgo_fault = udv_fault,
79 1.1 mrg };
80 1.1 mrg
81 1.1 mrg /*
82 1.1 mrg * the ops!
83 1.1 mrg */
84 1.1 mrg
85 1.1 mrg /*
86 1.1 mrg * udv_init
87 1.1 mrg *
88 1.1 mrg * init pager private data structures.
89 1.1 mrg */
90 1.1 mrg
91 1.38 chs static void
92 1.38 chs udv_init(void)
93 1.7 mrg {
94 1.7 mrg LIST_INIT(&udv_list);
95 1.53 ad mutex_init(&udv_lock, MUTEX_DEFAULT, IPL_NONE);
96 1.1 mrg }
97 1.1 mrg
98 1.1 mrg /*
99 1.1 mrg * udv_attach
100 1.1 mrg *
101 1.1 mrg * get a VM object that is associated with a device. allocate a new
102 1.1 mrg * one if needed.
103 1.1 mrg *
104 1.1 mrg * => caller must _not_ already be holding the lock on the uvm_object.
105 1.1 mrg * => in fact, nothing should be locked so that we can sleep here.
106 1.1 mrg */
107 1.38 chs
108 1.7 mrg struct uvm_object *
109 1.64 chs udv_attach(dev_t device, vm_prot_t accessprot,
110 1.44 thorpej voff_t off, /* used only for access check */
111 1.44 thorpej vsize_t size /* used only for access check */)
112 1.1 mrg {
113 1.7 mrg struct uvm_device *udv, *lcv;
114 1.41 gehenna const struct cdevsw *cdev;
115 1.73 riastrad dev_mmap_t *mapfn;
116 1.40 christos
117 1.71 skrll UVMHIST_FUNC(__func__);
118 1.71 skrll UVMHIST_CALLARGS(maphist, "(device=%#jx)", device,0,0,0);
119 1.7 mrg
120 1.7 mrg /*
121 1.7 mrg * before we do anything, ensure this device supports mmap
122 1.7 mrg */
123 1.7 mrg
124 1.41 gehenna cdev = cdevsw_lookup(device);
125 1.52 ad if (cdev == NULL) {
126 1.41 gehenna return (NULL);
127 1.52 ad }
128 1.41 gehenna mapfn = cdev->d_mmap;
129 1.65 riastrad if (mapfn == NULL || mapfn == nommap) {
130 1.7 mrg return(NULL);
131 1.52 ad }
132 1.22 drochner
133 1.22 drochner /*
134 1.25 simonb * Negative offsets on the object are not allowed.
135 1.22 drochner */
136 1.30 chs
137 1.56 mrg if ((cdev->d_flag & D_NEGOFFSAFE) == 0 &&
138 1.56 mrg off != UVM_UNKNOWN_OFFSET && off < 0)
139 1.25 simonb return(NULL);
140 1.13 cgd
141 1.13 cgd /*
142 1.13 cgd * Check that the specified range of the device allows the
143 1.13 cgd * desired protection.
144 1.34 chs *
145 1.13 cgd * XXX assumes VM_PROT_* == PROT_*
146 1.13 cgd * XXX clobbers off and size, but nothing else here needs them.
147 1.13 cgd */
148 1.13 cgd
149 1.13 cgd while (size != 0) {
150 1.52 ad if (cdev_mmap(device, off, accessprot) == -1) {
151 1.13 cgd return (NULL);
152 1.52 ad }
153 1.16 drochner off += PAGE_SIZE; size -= PAGE_SIZE;
154 1.13 cgd }
155 1.7 mrg
156 1.7 mrg /*
157 1.7 mrg * keep looping until we get it
158 1.7 mrg */
159 1.7 mrg
160 1.30 chs for (;;) {
161 1.7 mrg
162 1.7 mrg /*
163 1.34 chs * first, attempt to find it on the main list
164 1.7 mrg */
165 1.7 mrg
166 1.53 ad mutex_enter(&udv_lock);
167 1.30 chs LIST_FOREACH(lcv, &udv_list, u_list) {
168 1.7 mrg if (device == lcv->u_device)
169 1.7 mrg break;
170 1.7 mrg }
171 1.7 mrg
172 1.7 mrg /*
173 1.7 mrg * got it on main list. put a hold on it and unlock udv_lock.
174 1.7 mrg */
175 1.7 mrg
176 1.7 mrg if (lcv) {
177 1.7 mrg
178 1.7 mrg /*
179 1.7 mrg * if someone else has a hold on it, sleep and start
180 1.7 mrg * over again.
181 1.7 mrg */
182 1.7 mrg
183 1.7 mrg if (lcv->u_flags & UVM_DEVICE_HOLD) {
184 1.7 mrg lcv->u_flags |= UVM_DEVICE_WANTED;
185 1.49 thorpej UVM_UNLOCK_AND_WAIT(lcv, &udv_lock, false,
186 1.7 mrg "udv_attach",0);
187 1.7 mrg continue;
188 1.7 mrg }
189 1.7 mrg
190 1.7 mrg /* we are now holding it */
191 1.7 mrg lcv->u_flags |= UVM_DEVICE_HOLD;
192 1.53 ad mutex_exit(&udv_lock);
193 1.7 mrg
194 1.7 mrg /*
195 1.7 mrg * bump reference count, unhold, return.
196 1.7 mrg */
197 1.7 mrg
198 1.69 ad rw_enter(lcv->u_obj.vmobjlock, RW_WRITER);
199 1.7 mrg lcv->u_obj.uo_refs++;
200 1.69 ad rw_exit(lcv->u_obj.vmobjlock);
201 1.30 chs
202 1.53 ad mutex_enter(&udv_lock);
203 1.7 mrg if (lcv->u_flags & UVM_DEVICE_WANTED)
204 1.7 mrg wakeup(lcv);
205 1.7 mrg lcv->u_flags &= ~(UVM_DEVICE_WANTED|UVM_DEVICE_HOLD);
206 1.53 ad mutex_exit(&udv_lock);
207 1.7 mrg return(&lcv->u_obj);
208 1.7 mrg }
209 1.7 mrg
210 1.7 mrg /*
211 1.61 rmind * Did not find it on main list. Need to allocate a new one.
212 1.7 mrg */
213 1.7 mrg
214 1.53 ad mutex_exit(&udv_lock);
215 1.62 rmind
216 1.62 rmind /* Note: both calls may allocate memory and sleep. */
217 1.63 para udv = kmem_alloc(sizeof(*udv), KM_SLEEP);
218 1.62 rmind uvm_obj_init(&udv->u_obj, &uvm_deviceops, true, 1);
219 1.62 rmind
220 1.53 ad mutex_enter(&udv_lock);
221 1.7 mrg
222 1.7 mrg /*
223 1.7 mrg * now we have to double check to make sure no one added it
224 1.7 mrg * to the list while we were sleeping...
225 1.7 mrg */
226 1.7 mrg
227 1.30 chs LIST_FOREACH(lcv, &udv_list, u_list) {
228 1.7 mrg if (device == lcv->u_device)
229 1.7 mrg break;
230 1.7 mrg }
231 1.7 mrg
232 1.7 mrg /*
233 1.30 chs * did we lose a race to someone else?
234 1.30 chs * free our memory and retry.
235 1.7 mrg */
236 1.7 mrg
237 1.7 mrg if (lcv) {
238 1.53 ad mutex_exit(&udv_lock);
239 1.62 rmind uvm_obj_destroy(&udv->u_obj, true);
240 1.63 para kmem_free(udv, sizeof(*udv));
241 1.7 mrg continue;
242 1.7 mrg }
243 1.7 mrg
244 1.7 mrg /*
245 1.7 mrg * we have it! init the data structures, add to list
246 1.7 mrg * and return.
247 1.7 mrg */
248 1.7 mrg
249 1.7 mrg udv->u_flags = 0;
250 1.7 mrg udv->u_device = device;
251 1.7 mrg LIST_INSERT_HEAD(&udv_list, udv, u_list);
252 1.53 ad mutex_exit(&udv_lock);
253 1.7 mrg return(&udv->u_obj);
254 1.30 chs }
255 1.7 mrg /*NOTREACHED*/
256 1.1 mrg }
257 1.34 chs
258 1.1 mrg /*
259 1.1 mrg * udv_reference
260 1.1 mrg *
261 1.1 mrg * add a reference to a VM object. Note that the reference count must
262 1.1 mrg * already be one (the passed in reference) so there is no chance of the
263 1.1 mrg * udv being released or locked out here.
264 1.1 mrg *
265 1.1 mrg * => caller must call with object unlocked.
266 1.1 mrg */
267 1.1 mrg
268 1.7 mrg static void
269 1.44 thorpej udv_reference(struct uvm_object *uobj)
270 1.1 mrg {
271 1.71 skrll UVMHIST_FUNC(__func__); UVMHIST_CALLED(maphist);
272 1.1 mrg
273 1.69 ad rw_enter(uobj->vmobjlock, RW_WRITER);
274 1.7 mrg uobj->uo_refs++;
275 1.70 rin UVMHIST_LOG(maphist, "<- done (uobj=%#jx, ref = %jd)",
276 1.66 pgoyette (uintptr_t)uobj, uobj->uo_refs,0,0);
277 1.69 ad rw_exit(uobj->vmobjlock);
278 1.1 mrg }
279 1.1 mrg
280 1.1 mrg /*
281 1.1 mrg * udv_detach
282 1.1 mrg *
283 1.1 mrg * remove a reference to a VM object.
284 1.1 mrg *
285 1.1 mrg * => caller must call with object unlocked and map locked.
286 1.1 mrg */
287 1.1 mrg
288 1.7 mrg static void
289 1.44 thorpej udv_detach(struct uvm_object *uobj)
290 1.1 mrg {
291 1.30 chs struct uvm_device *udv = (struct uvm_device *)uobj;
292 1.71 skrll UVMHIST_FUNC(__func__); UVMHIST_CALLED(maphist);
293 1.1 mrg
294 1.7 mrg /*
295 1.7 mrg * loop until done
296 1.7 mrg */
297 1.24 pk again:
298 1.69 ad rw_enter(uobj->vmobjlock, RW_WRITER);
299 1.24 pk if (uobj->uo_refs > 1) {
300 1.30 chs uobj->uo_refs--;
301 1.69 ad rw_exit(uobj->vmobjlock);
302 1.70 rin UVMHIST_LOG(maphist," <- done, uobj=%#jx, ref=%jd",
303 1.66 pgoyette (uintptr_t)uobj,uobj->uo_refs,0,0);
304 1.24 pk return;
305 1.24 pk }
306 1.1 mrg
307 1.24 pk /*
308 1.30 chs * is it being held? if so, wait until others are done.
309 1.24 pk */
310 1.30 chs
311 1.53 ad mutex_enter(&udv_lock);
312 1.24 pk if (udv->u_flags & UVM_DEVICE_HOLD) {
313 1.24 pk udv->u_flags |= UVM_DEVICE_WANTED;
314 1.69 ad rw_exit(uobj->vmobjlock);
315 1.49 thorpej UVM_UNLOCK_AND_WAIT(udv, &udv_lock, false, "udv_detach",0);
316 1.24 pk goto again;
317 1.24 pk }
318 1.1 mrg
319 1.24 pk /*
320 1.24 pk * got it! nuke it now.
321 1.24 pk */
322 1.30 chs
323 1.24 pk LIST_REMOVE(udv, u_list);
324 1.24 pk if (udv->u_flags & UVM_DEVICE_WANTED)
325 1.24 pk wakeup(udv);
326 1.53 ad mutex_exit(&udv_lock);
327 1.69 ad rw_exit(uobj->vmobjlock);
328 1.62 rmind
329 1.62 rmind uvm_obj_destroy(uobj, true);
330 1.63 para kmem_free(udv, sizeof(*udv));
331 1.70 rin UVMHIST_LOG(maphist," <- done, freed uobj=%#jx", (uintptr_t)uobj,
332 1.66 pgoyette 0, 0, 0);
333 1.1 mrg }
334 1.1 mrg
335 1.1 mrg /*
336 1.1 mrg * udv_fault: non-standard fault routine for device "pages"
337 1.1 mrg *
338 1.1 mrg * => rather than having a "get" function, we have a fault routine
339 1.1 mrg * since we don't return vm_pages we need full control over the
340 1.1 mrg * pmap_enter map in
341 1.1 mrg * => all the usual fault data structured are locked by the caller
342 1.1 mrg * (i.e. maps(read), amap (if any), uobj)
343 1.1 mrg * => on return, we unlock all fault data structures
344 1.1 mrg * => flags: PGO_ALLPAGES: get all of the pages
345 1.1 mrg * PGO_LOCKED: fault data structures are locked
346 1.1 mrg * XXX: currently PGO_LOCKED is always required ... consider removing
347 1.1 mrg * it as a flag
348 1.1 mrg * => NOTE: vaddr is the VA of pps[0] in ufi->entry, _NOT_ pps[centeridx]
349 1.1 mrg */
350 1.1 mrg
351 1.7 mrg static int
352 1.44 thorpej udv_fault(struct uvm_faultinfo *ufi, vaddr_t vaddr, struct vm_page **pps,
353 1.47 drochner int npages, int centeridx, vm_prot_t access_type,
354 1.44 thorpej int flags)
355 1.1 mrg {
356 1.7 mrg struct vm_map_entry *entry = ufi->entry;
357 1.7 mrg struct uvm_object *uobj = entry->object.uvm_obj;
358 1.7 mrg struct uvm_device *udv = (struct uvm_device *)uobj;
359 1.20 kleink vaddr_t curr_va;
360 1.27 simonb off_t curr_offset;
361 1.25 simonb paddr_t paddr, mdpgno;
362 1.59 jmcneill u_int mmapflags;
363 1.25 simonb int lcv, retval;
364 1.7 mrg dev_t device;
365 1.17 ross vm_prot_t mapprot;
366 1.71 skrll UVMHIST_FUNC(__func__); UVMHIST_CALLED(maphist);
367 1.72 skrll UVMHIST_LOG(maphist," flags=%#jx", flags,0,0,0);
368 1.7 mrg
369 1.7 mrg /*
370 1.7 mrg * we do not allow device mappings to be mapped copy-on-write
371 1.7 mrg * so we kill any attempt to do so here.
372 1.7 mrg */
373 1.34 chs
374 1.7 mrg if (UVM_ET_ISCOPYONWRITE(entry)) {
375 1.70 rin UVMHIST_LOG(maphist, "<- failed -- COW entry (etype=%#jx)",
376 1.66 pgoyette entry->etype, 0,0,0);
377 1.62 rmind uvmfault_unlockall(ufi, ufi->entry->aref.ar_amap, uobj);
378 1.31 chs return(EIO);
379 1.7 mrg }
380 1.7 mrg
381 1.7 mrg /*
382 1.34 chs * get device map function.
383 1.7 mrg */
384 1.30 chs
385 1.7 mrg device = udv->u_device;
386 1.52 ad if (cdevsw_lookup(device) == NULL) {
387 1.52 ad /* XXX This should not happen */
388 1.62 rmind uvmfault_unlockall(ufi, ufi->entry->aref.ar_amap, uobj);
389 1.41 gehenna return (EIO);
390 1.41 gehenna }
391 1.7 mrg
392 1.7 mrg /*
393 1.10 chuck * now we must determine the offset in udv to use and the VA to
394 1.10 chuck * use for pmap_enter. note that we always use orig_map's pmap
395 1.10 chuck * for pmap_enter (even if we have a submap). since virtual
396 1.10 chuck * addresses in a submap must match the main map, this is ok.
397 1.7 mrg */
398 1.30 chs
399 1.7 mrg /* udv offset = (offset from start of entry) + entry's offset */
400 1.27 simonb curr_offset = entry->offset + (vaddr - entry->start);
401 1.10 chuck /* pmap va = vaddr (virtual address of pps[0]) */
402 1.10 chuck curr_va = vaddr;
403 1.34 chs
404 1.7 mrg /*
405 1.7 mrg * loop over the page range entering in as needed
406 1.7 mrg */
407 1.7 mrg
408 1.31 chs retval = 0;
409 1.7 mrg for (lcv = 0 ; lcv < npages ; lcv++, curr_offset += PAGE_SIZE,
410 1.7 mrg curr_va += PAGE_SIZE) {
411 1.7 mrg if ((flags & PGO_ALLPAGES) == 0 && lcv != centeridx)
412 1.7 mrg continue;
413 1.7 mrg
414 1.7 mrg if (pps[lcv] == PGO_DONTCARE)
415 1.7 mrg continue;
416 1.7 mrg
417 1.52 ad mdpgno = cdev_mmap(device, curr_offset, access_type);
418 1.11 mrg if (mdpgno == -1) {
419 1.31 chs retval = EIO;
420 1.7 mrg break;
421 1.7 mrg }
422 1.11 mrg paddr = pmap_phys_address(mdpgno);
423 1.59 jmcneill mmapflags = pmap_mmap_flags(mdpgno);
424 1.17 ross mapprot = ufi->entry->protection;
425 1.7 mrg UVMHIST_LOG(maphist,
426 1.70 rin " MAPPING: device: pm=%#jx, va=%#jx, pa=%#jx, at=%jd",
427 1.66 pgoyette (uintptr_t)ufi->orig_map->pmap, curr_va, paddr, mapprot);
428 1.59 jmcneill if (pmap_enter(ufi->orig_map->pmap, curr_va, paddr, mapprot,
429 1.59 jmcneill PMAP_CANFAIL | mapprot | mmapflags) != 0) {
430 1.18 thorpej /*
431 1.18 thorpej * pmap_enter() didn't have the resource to
432 1.18 thorpej * enter this mapping. Unlock everything,
433 1.18 thorpej * wait for the pagedaemon to free up some
434 1.18 thorpej * pages, and then tell uvm_fault() to start
435 1.18 thorpej * the fault again.
436 1.18 thorpej *
437 1.18 thorpej * XXX Needs some rethinking for the PGO_ALLPAGES
438 1.18 thorpej * XXX case.
439 1.18 thorpej */
440 1.54 ad pmap_update(ufi->orig_map->pmap); /* sync what we have so far */
441 1.18 thorpej uvmfault_unlockall(ufi, ufi->entry->aref.ar_amap,
442 1.62 rmind uobj);
443 1.68 chs return ENOMEM;
444 1.18 thorpej }
445 1.7 mrg }
446 1.1 mrg
447 1.54 ad pmap_update(ufi->orig_map->pmap);
448 1.62 rmind uvmfault_unlockall(ufi, ufi->entry->aref.ar_amap, uobj);
449 1.18 thorpej return (retval);
450 1.1 mrg }
451