uvm_device.c revision 1.76 1 1.76 riastrad /* $NetBSD: uvm_device.c,v 1.76 2022/07/06 01:15:51 riastradh Exp $ */
2 1.4 mrg
3 1.1 mrg /*
4 1.1 mrg * Copyright (c) 1997 Charles D. Cranor and Washington University.
5 1.1 mrg * All rights reserved.
6 1.1 mrg *
7 1.1 mrg * Redistribution and use in source and binary forms, with or without
8 1.1 mrg * modification, are permitted provided that the following conditions
9 1.1 mrg * are met:
10 1.1 mrg * 1. Redistributions of source code must retain the above copyright
11 1.1 mrg * notice, this list of conditions and the following disclaimer.
12 1.1 mrg * 2. Redistributions in binary form must reproduce the above copyright
13 1.1 mrg * notice, this list of conditions and the following disclaimer in the
14 1.1 mrg * documentation and/or other materials provided with the distribution.
15 1.1 mrg *
16 1.1 mrg * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
17 1.1 mrg * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
18 1.1 mrg * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
19 1.1 mrg * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
20 1.1 mrg * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
21 1.1 mrg * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
22 1.1 mrg * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
23 1.1 mrg * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
24 1.1 mrg * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
25 1.1 mrg * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
26 1.4 mrg *
27 1.4 mrg * from: Id: uvm_device.c,v 1.1.2.9 1998/02/06 05:11:47 chs Exp
28 1.1 mrg */
29 1.1 mrg
30 1.1 mrg /*
31 1.1 mrg * uvm_device.c: the device pager.
32 1.1 mrg */
33 1.39 lukem
34 1.39 lukem #include <sys/cdefs.h>
35 1.76 riastrad __KERNEL_RCSID(0, "$NetBSD: uvm_device.c,v 1.76 2022/07/06 01:15:51 riastradh Exp $");
36 1.39 lukem
37 1.39 lukem #include "opt_uvmhist.h"
38 1.1 mrg
39 1.1 mrg #include <sys/param.h>
40 1.1 mrg #include <sys/systm.h>
41 1.1 mrg #include <sys/conf.h>
42 1.1 mrg #include <sys/proc.h>
43 1.63 para #include <sys/kmem.h>
44 1.1 mrg
45 1.1 mrg #include <uvm/uvm.h>
46 1.1 mrg #include <uvm/uvm_device.h>
47 1.60 jmcneill #include <uvm/uvm_pmap.h>
48 1.1 mrg
49 1.1 mrg /*
50 1.1 mrg * private global data structure
51 1.1 mrg *
52 1.1 mrg * we keep a list of active device objects in the system.
53 1.1 mrg */
54 1.1 mrg
/* udv_list_struct: list head type for a list of struct uvm_device */
55 1.1 mrg LIST_HEAD(udv_list_struct, uvm_device);
/* the device objects currently on the list, linked through their u_list field */
56 1.1 mrg static struct udv_list_struct udv_list;
/*
 * udv_lock is held around every search, insertion and removal on udv_list
 * and around every update of a device object's u_flags in this file.
 */
57 1.67 ad static kmutex_t udv_lock __cacheline_aligned;
58 1.1 mrg
59 1.1 mrg /*
60 1.1 mrg * functions
61 1.1 mrg */
62 1.1 mrg
/*
 * file-local pager operations; each of the four is installed in the
 * uvm_deviceops table that follows.
 */
63 1.42 junyoung static void udv_init(void);
64 1.42 junyoung static void udv_reference(struct uvm_object *);
65 1.42 junyoung static void udv_detach(struct uvm_object *);
66 1.42 junyoung static int udv_fault(struct uvm_faultinfo *, vaddr_t,
67 1.47 drochner struct vm_page **, int, int, vm_prot_t,
68 1.45 thorpej int);
69 1.1 mrg
70 1.1 mrg /*
71 1.1 mrg * master pager structure
72 1.1 mrg */
73 1.1 mrg
/*
 * operations vector for device objects.  only the four members named
 * here are set; any other member of struct uvm_pagerops is left
 * zero-initialized by the designated initializer.  note that this pager
 * supplies a fault routine (pgo_fault) rather than a "get" routine.
 */
74 1.51 yamt const struct uvm_pagerops uvm_deviceops = {
75 1.48 christos .pgo_init = udv_init,
76 1.48 christos .pgo_reference = udv_reference,
77 1.48 christos .pgo_detach = udv_detach,
78 1.48 christos .pgo_fault = udv_fault,
79 1.1 mrg };
80 1.1 mrg
81 1.1 mrg /*
82 1.1 mrg * the ops!
83 1.1 mrg */
84 1.1 mrg
85 1.1 mrg /*
86 1.1 mrg * udv_init
87 1.1 mrg *
88 1.1 mrg * init pager private data structures.
89 1.1 mrg */
90 1.1 mrg
91 1.38 chs static void
92 1.38 chs udv_init(void)
93 1.7 mrg {
94 1.7 mrg LIST_INIT(&udv_list);
95 1.53 ad mutex_init(&udv_lock, MUTEX_DEFAULT, IPL_NONE);
96 1.1 mrg }
97 1.1 mrg
98 1.1 mrg /*
99 1.1 mrg * udv_attach
100 1.1 mrg *
101 1.1 mrg * get a VM object that is associated with a device. allocate a new
102 1.1 mrg * one if needed.
103 1.1 mrg *
104 1.1 mrg * => caller must _not_ already be holding the lock on the uvm_object.
105 1.1 mrg * => in fact, nothing should be locked so that we can sleep here.
 * => size must be non-zero (asserted below).
 * => returns NULL if the device has no cdevsw entry, if its d_mmap is
 *    NULL or nommap, if the offset/size sanity checks fail, or if
 *    cdev_mmap() returns -1 for any page of the requested range.
 * => on success returns the uvm_object embedded in the device's
 *    uvm_device: an existing one with its reference count bumped, or a
 *    freshly allocated one that has been added to udv_list.
106 1.1 mrg */
107 1.38 chs
108 1.7 mrg struct uvm_object *
109 1.64 chs udv_attach(dev_t device, vm_prot_t accessprot,
110 1.44 thorpej voff_t off, /* used only for access check */
111 1.44 thorpej vsize_t size /* used only for access check */)
112 1.1 mrg {
113 1.7 mrg struct uvm_device *udv, *lcv;
114 1.41 gehenna const struct cdevsw *cdev;
115 1.73 riastrad dev_mmap_t *mapfn;
116 1.40 christos
117 1.71 skrll UVMHIST_FUNC(__func__);
118 1.71 skrll UVMHIST_CALLARGS(maphist, "(device=%#jx)", device,0,0,0);
119 1.7 mrg
120 1.74 riastrad KASSERT(size > 0);
121 1.74 riastrad
122 1.7 mrg /*
123 1.7 mrg * before we do anything, ensure this device supports mmap
124 1.7 mrg */
125 1.7 mrg
126 1.41 gehenna cdev = cdevsw_lookup(device);
127 1.52 ad if (cdev == NULL) {
128 1.76 riastrad return NULL;
129 1.52 ad }
130 1.41 gehenna mapfn = cdev->d_mmap;
131 1.65 riastrad if (mapfn == NULL || mapfn == nommap) {
132 1.76 riastrad return NULL;
133 1.52 ad }
134 1.22 drochner
135 1.22 drochner /*
136 1.75 riastrad * Negative offsets on the object are not allowed, unless the
137 1.75 riastrad * device has affirmatively set D_NEGOFFSAFE.
 *
 * The checks are skipped entirely when off is UVM_UNKNOWN_OFFSET.
 * Besides rejecting off < 0, they reject any range whose end
 * (off + size) would exceed the largest voff_t value.
138 1.22 drochner */
139 1.75 riastrad if ((cdev->d_flag & D_NEGOFFSAFE) == 0 && off != UVM_UNKNOWN_OFFSET) {
140 1.75 riastrad if (off < 0)
141 1.75 riastrad return NULL;
142 1.75 riastrad if (size > __type_max(voff_t))
143 1.75 riastrad return NULL;
144 1.75 riastrad if (off > __type_max(voff_t) - size)
145 1.75 riastrad return NULL;
146 1.75 riastrad }
147 1.13 cgd
148 1.13 cgd /*
149 1.13 cgd * Check that the specified range of the device allows the
150 1.13 cgd * desired protection.
151 1.34 chs *
152 1.13 cgd * XXX assumes VM_PROT_* == PROT_*
153 1.13 cgd * XXX clobbers off and size, but nothing else here needs them.
154 1.13 cgd */
155 1.13 cgd
/*
 * NOTE(review): size is stepped down by PAGE_SIZE until it is exactly
 * zero, so this loop appears to rely on size being a multiple of
 * PAGE_SIZE -- confirm that all callers round it.
 */
156 1.13 cgd while (size != 0) {
157 1.52 ad if (cdev_mmap(device, off, accessprot) == -1) {
158 1.13 cgd return (NULL);
159 1.52 ad }
160 1.16 drochner off += PAGE_SIZE; size -= PAGE_SIZE;
161 1.13 cgd }
162 1.7 mrg
163 1.7 mrg /*
164 1.7 mrg * keep looping until we get it
165 1.7 mrg */
166 1.7 mrg
167 1.30 chs for (;;) {
168 1.7 mrg
169 1.7 mrg /*
170 1.34 chs * first, attempt to find it on the main list
171 1.7 mrg */
172 1.7 mrg
173 1.53 ad mutex_enter(&udv_lock);
174 1.30 chs LIST_FOREACH(lcv, &udv_list, u_list) {
175 1.7 mrg if (device == lcv->u_device)
176 1.7 mrg break;
177 1.7 mrg }
178 1.7 mrg
179 1.7 mrg /*
180 1.7 mrg * got it on main list. put a hold on it and unlock udv_lock.
181 1.7 mrg */
182 1.7 mrg
183 1.7 mrg if (lcv) {
184 1.7 mrg
185 1.7 mrg /*
186 1.7 mrg * if someone else has a hold on it, sleep and start
187 1.7 mrg * over again.
188 1.7 mrg */
189 1.7 mrg
190 1.7 mrg if (lcv->u_flags & UVM_DEVICE_HOLD) {
191 1.7 mrg lcv->u_flags |= UVM_DEVICE_WANTED;
/*
 * presumably UVM_UNLOCK_AND_WAIT releases udv_lock before
 * sleeping (confirm against the macro); the lock is taken
 * again at the top of the loop after the continue.
 */
192 1.49 thorpej UVM_UNLOCK_AND_WAIT(lcv, &udv_lock, false,
193 1.7 mrg "udv_attach",0);
194 1.7 mrg continue;
195 1.7 mrg }
196 1.7 mrg
/*
 * HOLD stays set while udv_lock is dropped to take the object
 * lock below; udv_detach checks HOLD before it removes and
 * frees a device object, and sleeps while it is set.
 */
197 1.7 mrg /* we are now holding it */
198 1.7 mrg lcv->u_flags |= UVM_DEVICE_HOLD;
199 1.53 ad mutex_exit(&udv_lock);
200 1.7 mrg
201 1.7 mrg /*
202 1.7 mrg * bump reference count, unhold, return.
203 1.7 mrg */
204 1.7 mrg
205 1.69 ad rw_enter(lcv->u_obj.vmobjlock, RW_WRITER);
206 1.7 mrg lcv->u_obj.uo_refs++;
207 1.69 ad rw_exit(lcv->u_obj.vmobjlock);
208 1.30 chs
209 1.53 ad mutex_enter(&udv_lock);
210 1.7 mrg if (lcv->u_flags & UVM_DEVICE_WANTED)
211 1.7 mrg wakeup(lcv);
212 1.7 mrg lcv->u_flags &= ~(UVM_DEVICE_WANTED|UVM_DEVICE_HOLD);
213 1.53 ad mutex_exit(&udv_lock);
214 1.76 riastrad return &lcv->u_obj;
215 1.7 mrg }
216 1.7 mrg
217 1.7 mrg /*
218 1.61 rmind * Did not find it on main list. Need to allocate a new one.
219 1.7 mrg */
220 1.7 mrg
221 1.53 ad mutex_exit(&udv_lock);
222 1.62 rmind
223 1.62 rmind /* Note: both calls may allocate memory and sleep. */
/*
 * NOTE(review): the final argument (1) to uvm_obj_init is presumably the
 * initial reference count, i.e. the reference handed to our caller --
 * confirm against uvm_obj_init().
 */
224 1.63 para udv = kmem_alloc(sizeof(*udv), KM_SLEEP);
225 1.62 rmind uvm_obj_init(&udv->u_obj, &uvm_deviceops, true, 1);
226 1.62 rmind
227 1.53 ad mutex_enter(&udv_lock);
228 1.7 mrg
229 1.7 mrg /*
230 1.7 mrg * now we have to double check to make sure no one added it
231 1.7 mrg * to the list while we were sleeping...
232 1.7 mrg */
233 1.7 mrg
234 1.30 chs LIST_FOREACH(lcv, &udv_list, u_list) {
235 1.7 mrg if (device == lcv->u_device)
236 1.7 mrg break;
237 1.7 mrg }
238 1.7 mrg
239 1.7 mrg /*
240 1.30 chs * did we lose a race to someone else?
241 1.30 chs * free our memory and retry.
242 1.7 mrg */
243 1.7 mrg
244 1.7 mrg if (lcv) {
245 1.53 ad mutex_exit(&udv_lock);
246 1.62 rmind uvm_obj_destroy(&udv->u_obj, true);
247 1.63 para kmem_free(udv, sizeof(*udv));
248 1.7 mrg continue;
249 1.7 mrg }
250 1.7 mrg
251 1.7 mrg /*
252 1.7 mrg * we have it! init the data structures, add to list
253 1.7 mrg * and return.
 *
 * udv_lock is still held from the re-check above, so the
 * insertion happens under the same lock hold as the search.
254 1.7 mrg */
255 1.7 mrg
256 1.7 mrg udv->u_flags = 0;
257 1.7 mrg udv->u_device = device;
258 1.7 mrg LIST_INSERT_HEAD(&udv_list, udv, u_list);
259 1.53 ad mutex_exit(&udv_lock);
260 1.76 riastrad return &udv->u_obj;
261 1.30 chs }
262 1.7 mrg /*NOTREACHED*/
263 1.1 mrg }
264 1.34 chs
265 1.1 mrg /*
266 1.1 mrg * udv_reference
267 1.1 mrg *
268 1.1 mrg * add a reference to a VM object. Note that the reference count must
269 1.1 mrg * already be one (the passed in reference) so there is no chance of the
270 1.1 mrg * udv being released or locked out here.
271 1.1 mrg *
272 1.1 mrg * => caller must call with object unlocked.
273 1.1 mrg */
274 1.1 mrg
275 1.7 mrg static void
276 1.44 thorpej udv_reference(struct uvm_object *uobj)
277 1.1 mrg {
278 1.71 skrll UVMHIST_FUNC(__func__); UVMHIST_CALLED(maphist);
279 1.1 mrg
280 1.69 ad rw_enter(uobj->vmobjlock, RW_WRITER);
281 1.7 mrg uobj->uo_refs++;
282 1.70 rin UVMHIST_LOG(maphist, "<- done (uobj=%#jx, ref = %jd)",
283 1.66 pgoyette (uintptr_t)uobj, uobj->uo_refs,0,0);
284 1.69 ad rw_exit(uobj->vmobjlock);
285 1.1 mrg }
286 1.1 mrg
287 1.1 mrg /*
288 1.1 mrg * udv_detach
289 1.1 mrg *
290 1.1 mrg * remove a reference to a VM object.
291 1.1 mrg *
292 1.1 mrg * => caller must call with object unlocked and map locked.
293 1.1 mrg */
294 1.1 mrg
295 1.7 mrg static void
296 1.44 thorpej udv_detach(struct uvm_object *uobj)
297 1.1 mrg {
298 1.30 chs struct uvm_device *udv = (struct uvm_device *)uobj;
299 1.71 skrll UVMHIST_FUNC(__func__); UVMHIST_CALLED(maphist);
300 1.1 mrg
301 1.7 mrg /*
302 1.7 mrg * loop until done
303 1.7 mrg */
304 1.24 pk again:
305 1.69 ad rw_enter(uobj->vmobjlock, RW_WRITER);
306 1.24 pk if (uobj->uo_refs > 1) {
307 1.30 chs uobj->uo_refs--;
308 1.69 ad rw_exit(uobj->vmobjlock);
309 1.70 rin UVMHIST_LOG(maphist," <- done, uobj=%#jx, ref=%jd",
310 1.66 pgoyette (uintptr_t)uobj,uobj->uo_refs,0,0);
311 1.24 pk return;
312 1.24 pk }
313 1.1 mrg
314 1.24 pk /*
315 1.30 chs * is it being held? if so, wait until others are done.
316 1.24 pk */
317 1.30 chs
318 1.53 ad mutex_enter(&udv_lock);
319 1.24 pk if (udv->u_flags & UVM_DEVICE_HOLD) {
320 1.24 pk udv->u_flags |= UVM_DEVICE_WANTED;
321 1.69 ad rw_exit(uobj->vmobjlock);
322 1.49 thorpej UVM_UNLOCK_AND_WAIT(udv, &udv_lock, false, "udv_detach",0);
323 1.24 pk goto again;
324 1.24 pk }
325 1.1 mrg
326 1.24 pk /*
327 1.24 pk * got it! nuke it now.
328 1.24 pk */
329 1.30 chs
330 1.24 pk LIST_REMOVE(udv, u_list);
331 1.24 pk if (udv->u_flags & UVM_DEVICE_WANTED)
332 1.24 pk wakeup(udv);
333 1.53 ad mutex_exit(&udv_lock);
334 1.69 ad rw_exit(uobj->vmobjlock);
335 1.62 rmind
336 1.62 rmind uvm_obj_destroy(uobj, true);
337 1.63 para kmem_free(udv, sizeof(*udv));
338 1.70 rin UVMHIST_LOG(maphist," <- done, freed uobj=%#jx", (uintptr_t)uobj,
339 1.66 pgoyette 0, 0, 0);
340 1.1 mrg }
341 1.1 mrg
342 1.1 mrg /*
343 1.1 mrg * udv_fault: non-standard fault routine for device "pages"
344 1.1 mrg *
345 1.1 mrg * => rather than having a "get" function, we have a fault routine
346 1.1 mrg * since we don't return vm_pages we need full control over the
347 1.1 mrg * pmap_enter map in
348 1.1 mrg * => all the usual fault data structures are locked by the caller
349 1.1 mrg * (i.e. maps(read), amap (if any), uobj)
350 1.1 mrg * => on return, we unlock all fault data structures
351 1.1 mrg * => flags: PGO_ALLPAGES: get all of the pages
352 1.1 mrg * PGO_LOCKED: fault data structures are locked
353 1.1 mrg * XXX: currently PGO_LOCKED is always required ... consider removing
354 1.1 mrg * it as a flag
355 1.1 mrg * => NOTE: vaddr is the VA of pps[0] in ufi->entry, _NOT_ pps[centeridx]
 * => without PGO_ALLPAGES only the page at index centeridx is mapped
 * => slots of pps[] equal to PGO_DONTCARE are skipped
 * => returns 0 on success, EIO if the entry is copy-on-write, the
 *    device has no cdevsw entry, or cdev_mmap() returns -1 for a page,
 *    and ENOMEM if pmap_enter() fails
356 1.1 mrg */
357 1.1 mrg
358 1.7 mrg static int
359 1.44 thorpej udv_fault(struct uvm_faultinfo *ufi, vaddr_t vaddr, struct vm_page **pps,
360 1.47 drochner int npages, int centeridx, vm_prot_t access_type,
361 1.44 thorpej int flags)
362 1.1 mrg {
363 1.7 mrg struct vm_map_entry *entry = ufi->entry;
364 1.7 mrg struct uvm_object *uobj = entry->object.uvm_obj;
365 1.7 mrg struct uvm_device *udv = (struct uvm_device *)uobj;
366 1.20 kleink vaddr_t curr_va;
367 1.27 simonb off_t curr_offset;
368 1.25 simonb paddr_t paddr, mdpgno;
369 1.59 jmcneill u_int mmapflags;
370 1.25 simonb int lcv, retval;
371 1.7 mrg dev_t device;
372 1.17 ross vm_prot_t mapprot;
373 1.71 skrll UVMHIST_FUNC(__func__); UVMHIST_CALLED(maphist);
374 1.72 skrll UVMHIST_LOG(maphist," flags=%#jx", flags,0,0,0);
375 1.7 mrg
376 1.7 mrg /*
377 1.7 mrg * we do not allow device mappings to be mapped copy-on-write
378 1.7 mrg * so we kill any attempt to do so here.
379 1.7 mrg */
380 1.34 chs
381 1.7 mrg if (UVM_ET_ISCOPYONWRITE(entry)) {
382 1.70 rin UVMHIST_LOG(maphist, "<- failed -- COW entry (etype=%#jx)",
383 1.66 pgoyette entry->etype, 0,0,0);
384 1.62 rmind uvmfault_unlockall(ufi, ufi->entry->aref.ar_amap, uobj);
385 1.76 riastrad return EIO;
386 1.7 mrg }
387 1.7 mrg
388 1.7 mrg /*
389 1.34 chs * get device map function.
 *
 * only the existence of the cdevsw entry is checked here; the
 * mapping itself is obtained through cdev_mmap() in the loop below.
390 1.7 mrg */
391 1.30 chs
392 1.7 mrg device = udv->u_device;
393 1.52 ad if (cdevsw_lookup(device) == NULL) {
394 1.52 ad /* XXX This should not happen */
395 1.62 rmind uvmfault_unlockall(ufi, ufi->entry->aref.ar_amap, uobj);
396 1.76 riastrad return EIO;
397 1.41 gehenna }
398 1.7 mrg
399 1.7 mrg /*
400 1.10 chuck * now we must determine the offset in udv to use and the VA to
401 1.10 chuck * use for pmap_enter. note that we always use orig_map's pmap
402 1.10 chuck * for pmap_enter (even if we have a submap). since virtual
403 1.10 chuck * addresses in a submap must match the main map, this is ok.
404 1.7 mrg */
405 1.30 chs
406 1.7 mrg /* udv offset = (offset from start of entry) + entry's offset */
407 1.27 simonb curr_offset = entry->offset + (vaddr - entry->start);
408 1.10 chuck /* pmap va = vaddr (virtual address of pps[0]) */
409 1.10 chuck curr_va = vaddr;
410 1.34 chs
411 1.7 mrg /*
412 1.7 mrg * loop over the page range entering in as needed
 *
 * curr_offset and curr_va advance by one page on every iteration,
 * including the iterations that are skipped with continue.
413 1.7 mrg */
414 1.7 mrg
415 1.31 chs retval = 0;
416 1.7 mrg for (lcv = 0 ; lcv < npages ; lcv++, curr_offset += PAGE_SIZE,
417 1.7 mrg curr_va += PAGE_SIZE) {
418 1.7 mrg if ((flags & PGO_ALLPAGES) == 0 && lcv != centeridx)
419 1.7 mrg continue;
420 1.7 mrg
421 1.7 mrg if (pps[lcv] == PGO_DONTCARE)
422 1.7 mrg continue;
423 1.7 mrg
/*
 * cdev_mmap() reports failure as -1; on failure we stop mapping
 * and fall out of the loop to the common flush/unlock/return path.
 */
424 1.52 ad mdpgno = cdev_mmap(device, curr_offset, access_type);
425 1.11 mrg if (mdpgno == -1) {
426 1.31 chs retval = EIO;
427 1.7 mrg break;
428 1.7 mrg }
429 1.11 mrg paddr = pmap_phys_address(mdpgno);
430 1.59 jmcneill mmapflags = pmap_mmap_flags(mdpgno);
/*
 * the mapping is entered with the map entry's protection, not
 * with access_type.
 */
431 1.17 ross mapprot = ufi->entry->protection;
432 1.7 mrg UVMHIST_LOG(maphist,
433 1.70 rin " MAPPING: device: pm=%#jx, va=%#jx, pa=%#jx, at=%jd",
434 1.66 pgoyette (uintptr_t)ufi->orig_map->pmap, curr_va, paddr, mapprot);
435 1.59 jmcneill if (pmap_enter(ufi->orig_map->pmap, curr_va, paddr, mapprot,
436 1.59 jmcneill PMAP_CANFAIL | mapprot | mmapflags) != 0) {
437 1.18 thorpej /*
438 1.18 thorpej * pmap_enter() didn't have the resource to
439 1.18 thorpej * enter this mapping. Flush the mappings
440 1.18 thorpej * entered so far, unlock everything and
441 1.18 thorpej * return ENOMEM; no waiting is done here.
442 1.18 thorpej * NOTE(review): presumably the caller waits for memory and restarts the fault -- confirm.
443 1.18 thorpej *
444 1.18 thorpej * XXX Needs some rethinking for the PGO_ALLPAGES
445 1.18 thorpej * XXX case.
446 1.18 thorpej */
447 1.54 ad pmap_update(ufi->orig_map->pmap); /* sync what we have so far */
448 1.18 thorpej uvmfault_unlockall(ufi, ufi->entry->aref.ar_amap,
449 1.62 rmind uobj);
450 1.68 chs return ENOMEM;
451 1.18 thorpej }
452 1.7 mrg }
453 1.1 mrg
454 1.54 ad pmap_update(ufi->orig_map->pmap);
455 1.62 rmind uvmfault_unlockall(ufi, ufi->entry->aref.ar_amap, uobj);
456 1.76 riastrad return retval;
457 1.1 mrg }
458