iommu.c revision 1.51.4.5 1 /* $NetBSD: iommu.c,v 1.51.4.5 2002/11/08 09:24:57 tron Exp $ */
2
3 /*
4 * Copyright (c) 2001, 2002 Eduardo Horvath
5 * Copyright (c) 1999, 2000 Matthew R. Green
6 * All rights reserved.
7 *
8 * Redistribution and use in source and binary forms, with or without
9 * modification, are permitted provided that the following conditions
10 * are met:
11 * 1. Redistributions of source code must retain the above copyright
12 * notice, this list of conditions and the following disclaimer.
13 * 2. Redistributions in binary form must reproduce the above copyright
14 * notice, this list of conditions and the following disclaimer in the
15 * documentation and/or other materials provided with the distribution.
16 * 3. The name of the author may not be used to endorse or promote products
17 * derived from this software without specific prior written permission.
18 *
19 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
20 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
21 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
22 * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
23 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
24 * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
25 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
26 * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
27 * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
28 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29 * SUCH DAMAGE.
30 */
31
32 /*
33 * UltraSPARC IOMMU support; used by both the sbus and pci code.
34 */
35 #include "opt_ddb.h"
36
37 #include <sys/param.h>
38 #include <sys/extent.h>
39 #include <sys/malloc.h>
40 #include <sys/systm.h>
41 #include <sys/device.h>
42 #include <sys/proc.h>
43
44 #include <uvm/uvm_extern.h>
45
46 #include <machine/bus.h>
47 #include <sparc64/sparc64/cache.h>
48 #include <sparc64/dev/iommureg.h>
49 #include <sparc64/dev/iommuvar.h>
50
51 #include <machine/autoconf.h>
52 #include <machine/cpu.h>
53
54 #ifdef DEBUG
55 #define IDB_BUSDMA 0x1
56 #define IDB_IOMMU 0x2
57 #define IDB_INFO 0x4
58 #define IDB_SYNC 0x8
59 int iommudebug = 0x0;
60 #define DPRINTF(l, s) do { if (iommudebug & l) printf s; } while (0)
61 #else
62 #define DPRINTF(l, s)
63 #endif
64
65 #define iommu_strbuf_flush(i, v) do { \
66 if ((i)->sb_flush) \
67 bus_space_write_8((i)->sb_is->is_bustag, (i)->sb_sb, \
68 STRBUFREG(strbuf_pgflush), (v)); \
69 } while (0)
70
71 static int iommu_strbuf_flush_done __P((struct strbuf_ctl *));
72
73 /*
74 * initialise the UltraSPARC IOMMU (SBUS or PCI):
75 * - allocate and setup the iotsb.
76 * - enable the IOMMU
77 * - initialise the streaming buffers (if they exist)
78 * - create a private DVMA map.
79 */
80 void
81 iommu_init(name, is, tsbsize, iovabase)
82 char *name;
83 struct iommu_state *is;
84 int tsbsize;
85 u_int32_t iovabase;
86 {
87 psize_t size;
88 vaddr_t va;
89 paddr_t pa;
90 struct vm_page *m;
91 struct pglist mlist;
92
93 /*
94 * Setup the iommu.
95 *
96 * The sun4u iommu is part of the SBUS or PCI controller so we will
97 * deal with it here..
98 *
99 * For sysio and psycho/psycho+ the IOMMU address space always ends at
100 * 0xffffe000, but the starting address depends on the size of the
101 * map. The map size is 1024 * 2 ^ is->is_tsbsize entries, where each
102 * entry is 8 bytes. The start of the map can be calculated by
103 * (0xffffe000 << (8 + is->is_tsbsize)).
104 *
105 * But sabre and hummingbird use a different scheme that seems to
106 * be hard-wired, so we read the start and size from the PROM and
107 * just use those values.
108 */
109 is->is_cr = (tsbsize << 16) | IOMMUCR_EN;
110 is->is_tsbsize = tsbsize;
111 if (iovabase == -1) {
112 is->is_dvmabase = IOTSB_VSTART(is->is_tsbsize);
113 is->is_dvmaend = IOTSB_VEND;
114 } else {
115 is->is_dvmabase = iovabase;
116 is->is_dvmaend = iovabase + IOTSB_VSIZE(tsbsize);
117 }
118
119 /*
120 * Allocate memory for I/O pagetables. They need to be physically
121 * contiguous.
122 */
123
124 size = NBPG<<(is->is_tsbsize);
125 TAILQ_INIT(&mlist);
126 if (uvm_pglistalloc((psize_t)size, (paddr_t)0, (paddr_t)-1,
127 (paddr_t)NBPG, (paddr_t)0, &mlist, 1, 0) != 0)
128 panic("iommu_init: no memory");
129
130 va = uvm_km_valloc(kernel_map, size);
131 if (va == 0)
132 panic("iommu_init: no memory");
133 is->is_tsb = (int64_t *)va;
134
135 m = TAILQ_FIRST(&mlist);
136 is->is_ptsb = VM_PAGE_TO_PHYS(m);
137
138 /* Map the pages */
139 for (; m != NULL; m = TAILQ_NEXT(m,pageq)) {
140 pa = VM_PAGE_TO_PHYS(m);
141 pmap_enter(pmap_kernel(), va, pa | PMAP_NVC,
142 VM_PROT_READ|VM_PROT_WRITE,
143 VM_PROT_READ|VM_PROT_WRITE|PMAP_WIRED);
144 va += NBPG;
145 }
146 pmap_update(pmap_kernel());
147 bzero(is->is_tsb, size);
148
149 #ifdef DEBUG
150 if (iommudebug & IDB_INFO)
151 {
152 /* Probe the iommu */
153
154 printf("iommu regs at: cr=%lx tsb=%lx flush=%lx\n",
155 (u_long)bus_space_read_8(is->is_bustag, is->is_iommu,
156 offsetof (struct iommureg, iommu_cr)),
157 (u_long)bus_space_read_8(is->is_bustag, is->is_iommu,
158 offsetof (struct iommureg, iommu_tsb)),
159 (u_long)bus_space_read_8(is->is_bustag, is->is_iommu,
160 offsetof (struct iommureg, iommu_flush)));
161 printf("iommu cr=%llx tsb=%llx\n",
162 (unsigned long long)bus_space_read_8(is->is_bustag,
163 is->is_iommu,
164 offsetof (struct iommureg, iommu_cr)),
165 (unsigned long long)bus_space_read_8(is->is_bustag,
166 is->is_iommu,
167 offsetof (struct iommureg, iommu_tsb)));
168 printf("TSB base %p phys %llx\n", (void *)is->is_tsb,
169 (unsigned long long)is->is_ptsb);
170 delay(1000000); /* 1 s */
171 }
172 #endif
173
174 /*
175 * now actually start up the IOMMU
176 */
177 iommu_reset(is);
178
179 /*
180 * Now all the hardware's working we need to allocate a dvma map.
181 */
182 printf("DVMA map: %x to %x\n",
183 (unsigned int)is->is_dvmabase,
184 (unsigned int)is->is_dvmaend);
185 printf("IOTSB: %llx to %llx\n",
186 (unsigned long long)is->is_ptsb,
187 (unsigned long long)(is->is_ptsb + size));
188 is->is_dvmamap = extent_create(name,
189 is->is_dvmabase, is->is_dvmaend - NBPG,
190 M_DEVBUF, 0, 0, EX_NOWAIT);
191 }
192
193 /*
194 * Streaming buffers don't exist on the UltraSPARC IIi; we should have
195 * detected that already and disabled them. If not, we will notice that
196 * they aren't there when the STRBUF_EN bit does not remain.
197 */
198 void
199 iommu_reset(is)
200 struct iommu_state *is;
201 {
202 int i;
203 struct strbuf_ctl *sb;
204
205 /* Need to do 64-bit stores */
206 bus_space_write_8(is->is_bustag, is->is_iommu, IOMMUREG(iommu_tsb),
207 is->is_ptsb);
208
209 /* Enable IOMMU in diagnostic mode */
210 bus_space_write_8(is->is_bustag, is->is_iommu, IOMMUREG(iommu_cr),
211 is->is_cr|IOMMUCR_DE);
212
213 for (i=0; i<2; i++) {
214 if ((sb = is->is_sb[i])) {
215
216 /* Enable diagnostics mode? */
217 bus_space_write_8(is->is_bustag, is->is_sb[i]->sb_sb,
218 STRBUFREG(strbuf_ctl), STRBUF_EN);
219
220 /* No streaming buffers? Disable them */
221 if (bus_space_read_8(is->is_bustag,
222 is->is_sb[i]->sb_sb,
223 STRBUFREG(strbuf_ctl)) == 0) {
224 is->is_sb[i]->sb_flush = NULL;
225 } else {
226 /*
227 * locate the pa of the flush buffer.
228 */
229 (void)pmap_extract(pmap_kernel(),
230 (vaddr_t)is->is_sb[i]->sb_flush,
231 &is->is_sb[i]->sb_flushpa);
232 }
233 }
234 }
235 }
236
237 /*
238 * Here are the iommu control routines.
239 */
240 void
241 iommu_enter(sb, va, pa, flags)
242 struct strbuf_ctl *sb;
243 vaddr_t va;
244 int64_t pa;
245 int flags;
246 {
247 struct iommu_state *is = sb->sb_is;
248 int strbuf = (flags & BUS_DMA_STREAMING);
249 int64_t tte;
250
251 #ifdef DIAGNOSTIC
252 if (va < is->is_dvmabase || va > is->is_dvmaend)
253 panic("iommu_enter: va %#lx not in DVMA space", va);
254 #endif
255
256 /* Is the streamcache flush really needed? */
257 if (sb->sb_flush) {
258 iommu_strbuf_flush(sb, va);
259 iommu_strbuf_flush_done(sb);
260 } else
261 /* If we can't flush the strbuf don't enable it. */
262 strbuf = 0;
263
264 tte = MAKEIOTTE(pa, !(flags & BUS_DMA_NOWRITE),
265 !(flags & BUS_DMA_NOCACHE), (strbuf));
266 #ifdef DEBUG
267 tte |= (flags & 0xff000LL)<<(4*8);
268 #endif
269
270 DPRINTF(IDB_IOMMU, ("Clearing TSB slot %d for va %p\n",
271 (int)IOTSBSLOT(va,is->is_tsbsize), (void *)(u_long)va));
272 is->is_tsb[IOTSBSLOT(va,is->is_tsbsize)] = tte;
273 bus_space_write_8(is->is_bustag, is->is_iommu,
274 IOMMUREG(iommu_flush), va);
275 DPRINTF(IDB_IOMMU, ("iommu_enter: va %lx pa %lx TSB[%lx]@%p=%lx\n",
276 va, (long)pa, (u_long)IOTSBSLOT(va,is->is_tsbsize),
277 (void *)(u_long)&is->is_tsb[IOTSBSLOT(va,is->is_tsbsize)],
278 (u_long)tte));
279 }
280
281
282 /*
283 * Find the value of a DVMA address (debug routine).
284 */
285 paddr_t
286 iommu_extract(is, dva)
287 struct iommu_state *is;
288 vaddr_t dva;
289 {
290 int64_t tte = 0;
291
292 if (dva >= is->is_dvmabase && dva < is->is_dvmaend)
293 tte = is->is_tsb[IOTSBSLOT(dva, is->is_tsbsize)];
294
295 if ((tte & IOTTE_V) == 0)
296 return ((paddr_t)-1L);
297 return (tte & IOTTE_PAMASK);
298 }
299
300 /*
301 * iommu_remove: removes mappings created by iommu_enter
302 *
303 * Only demap from IOMMU if flag is set.
304 *
305 * XXX: this function needs better internal error checking.
306 */
307 void
308 iommu_remove(is, va, len)
309 struct iommu_state *is;
310 vaddr_t va;
311 size_t len;
312 {
313
314 #ifdef DIAGNOSTIC
315 if (va < is->is_dvmabase || va > is->is_dvmaend)
316 panic("iommu_remove: va 0x%lx not in DVMA space", (u_long)va);
317 if ((long)(va + len) < (long)va)
318 panic("iommu_remove: va 0x%lx + len 0x%lx wraps",
319 (long) va, (long) len);
320 if (len & ~0xfffffff)
321 panic("iommu_remove: rediculous len 0x%lx", (u_long)len);
322 #endif
323
324 va = trunc_page(va);
325 DPRINTF(IDB_IOMMU, ("iommu_remove: va %lx TSB[%lx]@%p\n",
326 va, (u_long)IOTSBSLOT(va, is->is_tsbsize),
327 &is->is_tsb[IOTSBSLOT(va, is->is_tsbsize)]));
328 while (len > 0) {
329 DPRINTF(IDB_IOMMU, ("iommu_remove: clearing TSB slot %d "
330 "for va %p size %lx\n",
331 (int)IOTSBSLOT(va,is->is_tsbsize), (void *)(u_long)va,
332 (u_long)len));
333 if (len <= NBPG)
334 len = 0;
335 else
336 len -= NBPG;
337
338 /* XXX Zero-ing the entry would not require RMW */
339 is->is_tsb[IOTSBSLOT(va,is->is_tsbsize)] &= ~IOTTE_V;
340 bus_space_write_8(is->is_bustag, is->is_iommu,
341 IOMMUREG(iommu_flush), va);
342 va += NBPG;
343 }
344 }
345
346 static int
347 iommu_strbuf_flush_done(sb)
348 struct strbuf_ctl *sb;
349 {
350 struct iommu_state *is = sb->sb_is;
351 struct timeval cur, flushtimeout;
352
353 #define BUMPTIME(t, usec) { \
354 register volatile struct timeval *tp = (t); \
355 register long us; \
356 \
357 tp->tv_usec = us = tp->tv_usec + (usec); \
358 if (us >= 1000000) { \
359 tp->tv_usec = us - 1000000; \
360 tp->tv_sec++; \
361 } \
362 }
363
364 if (!sb->sb_flush)
365 return (0);
366
367 /*
368 * Streaming buffer flushes:
369 *
370 * 1 Tell strbuf to flush by storing va to strbuf_pgflush. If
371 * we're not on a cache line boundary (64-bits):
372 * 2 Store 0 in flag
373 * 3 Store pointer to flag in flushsync
374 * 4 wait till flushsync becomes 0x1
375 *
376 * If it takes more than .5 sec, something
377 * went wrong.
378 */
379
380 *sb->sb_flush = 0;
381 bus_space_write_8(is->is_bustag, sb->sb_sb,
382 STRBUFREG(strbuf_flushsync), sb->sb_flushpa);
383
384 microtime(&flushtimeout);
385 cur = flushtimeout;
386 BUMPTIME(&flushtimeout, 500000); /* 1/2 sec */
387
388 DPRINTF(IDB_IOMMU, ("iommu_strbuf_flush_done: flush = %lx "
389 "at va = %lx pa = %lx now=%lx:%lx until = %lx:%lx\n",
390 (long)*sb->sb_flush, (long)sb->sb_flush, (long)sb->sb_flushpa,
391 cur.tv_sec, cur.tv_usec,
392 flushtimeout.tv_sec, flushtimeout.tv_usec));
393
394 /* Bypass non-coherent D$ */
395 while ((!ldxa(sb->sb_flushpa, ASI_PHYS_CACHED)) &&
396 ((cur.tv_sec <= flushtimeout.tv_sec) &&
397 (cur.tv_usec <= flushtimeout.tv_usec)))
398 microtime(&cur);
399
400 #ifdef DIAGNOSTIC
401 if (!ldxa(sb->sb_flushpa, ASI_PHYS_CACHED)) {
402 printf("iommu_strbuf_flush_done: flush timeout %p, at %p\n",
403 (void *)(u_long)*sb->sb_flush,
404 (void *)(u_long)sb->sb_flushpa); /* panic? */
405 #ifdef DDB
406 Debugger();
407 #endif
408 }
409 #endif
410 DPRINTF(IDB_IOMMU, ("iommu_strbuf_flush_done: flushed\n"));
411 return (*sb->sb_flush);
412 }
413
414 /*
415 * IOMMU DVMA operations, common to SBUS and PCI.
416 */
417 int
418 iommu_dvmamap_load(t, sb, map, buf, buflen, p, flags)
419 bus_dma_tag_t t;
420 struct strbuf_ctl *sb;
421 bus_dmamap_t map;
422 void *buf;
423 bus_size_t buflen;
424 struct proc *p;
425 int flags;
426 {
427 struct iommu_state *is = sb->sb_is;
428 int s;
429 int err;
430 bus_size_t sgsize;
431 paddr_t curaddr;
432 u_long dvmaddr, sgstart, sgend;
433 bus_size_t align, boundary;
434 vaddr_t vaddr = (vaddr_t)buf;
435 int seg;
436 pmap_t pmap;
437
438 if (map->dm_nsegs) {
439 /* Already in use?? */
440 #ifdef DIAGNOSTIC
441 printf("iommu_dvmamap_load: map still in use\n");
442 #endif
443 bus_dmamap_unload(t, map);
444 }
445 /*
446 * Make sure that on error condition we return "no valid mappings".
447 */
448 map->dm_nsegs = 0;
449
450 if (buflen > map->_dm_size) {
451 DPRINTF(IDB_BUSDMA,
452 ("iommu_dvmamap_load(): error %d > %d -- "
453 "map size exceeded!\n", (int)buflen, (int)map->_dm_size));
454 return (EINVAL);
455 }
456
457 sgsize = round_page(buflen + ((int)vaddr & PGOFSET));
458
459 /*
460 * A boundary presented to bus_dmamem_alloc() takes precedence
461 * over boundary in the map.
462 */
463 if ((boundary = (map->dm_segs[0]._ds_boundary)) == 0)
464 boundary = map->_dm_boundary;
465 align = max(map->dm_segs[0]._ds_align, NBPG);
466 s = splhigh();
467 /*
468 * If our segment size is larger than the boundary we need to
469 * split the transfer up int little pieces ourselves.
470 */
471 err = extent_alloc(is->is_dvmamap, sgsize, align,
472 (sgsize > boundary) ? 0 : boundary,
473 EX_NOWAIT|EX_BOUNDZERO, &dvmaddr);
474 splx(s);
475
476 #ifdef DEBUG
477 if (err || (dvmaddr == (bus_addr_t)-1))
478 {
479 printf("iommu_dvmamap_load(): extent_alloc(%d, %x) failed!\n",
480 (int)sgsize, flags);
481 #ifdef DDB
482 Debugger();
483 #endif
484 }
485 #endif
486 if (err != 0)
487 return (err);
488
489 if (dvmaddr == (bus_addr_t)-1)
490 return (ENOMEM);
491
492 /* Set the active DVMA map */
493 map->_dm_dvmastart = dvmaddr;
494 map->_dm_dvmasize = sgsize;
495
496 /*
497 * Now split the DVMA range into segments, not crossing
498 * the boundary.
499 */
500 seg = 0;
501 sgstart = dvmaddr + (vaddr & PGOFSET);
502 sgend = sgstart + buflen - 1;
503 map->dm_segs[seg].ds_addr = sgstart;
504 DPRINTF(IDB_INFO, ("iommu_dvmamap_load: boundary %lx boundary-1 %lx "
505 "~(boundary-1) %lx\n", (long)boundary, (long)(boundary-1), (long)~(boundary-1)));
506 while ((sgstart & ~(boundary - 1)) != (sgend & ~(boundary - 1))) {
507 /* Oops. We crossed a boundary. Split the xfer. */
508 DPRINTF(IDB_INFO, ("iommu_dvmamap_load: "
509 "seg %d start %lx size %lx\n", seg,
510 (long)map->dm_segs[seg].ds_addr,
511 (long)map->dm_segs[seg].ds_len));
512 map->dm_segs[seg].ds_len =
513 boundary - (sgstart & (boundary - 1));
514 if (++seg >= map->_dm_segcnt) {
515 /* Too many segments. Fail the operation. */
516 DPRINTF(IDB_INFO, ("iommu_dvmamap_load: "
517 "too many segments %d\n", seg));
518 s = splhigh();
519 /* How can this fail? And if it does what can we do? */
520 err = extent_free(is->is_dvmamap,
521 dvmaddr, sgsize, EX_NOWAIT);
522 map->_dm_dvmastart = 0;
523 map->_dm_dvmasize = 0;
524 splx(s);
525 return (E2BIG);
526 }
527 sgstart = roundup(sgstart, boundary);
528 map->dm_segs[seg].ds_addr = sgstart;
529 }
530 map->dm_segs[seg].ds_len = sgend - sgstart + 1;
531 DPRINTF(IDB_INFO, ("iommu_dvmamap_load: "
532 "seg %d start %lx size %lx\n", seg,
533 (long)map->dm_segs[seg].ds_addr, (long)map->dm_segs[seg].ds_len));
534 map->dm_nsegs = seg+1;
535 map->dm_mapsize = buflen;
536
537 if (p != NULL)
538 pmap = p->p_vmspace->vm_map.pmap;
539 else
540 pmap = pmap_kernel();
541
542 for (; buflen > 0; ) {
543 /*
544 * Get the physical address for this page.
545 */
546 if (pmap_extract(pmap, (vaddr_t)vaddr, &curaddr) == FALSE) {
547 bus_dmamap_unload(t, map);
548 return (-1);
549 }
550
551 /*
552 * Compute the segment size, and adjust counts.
553 */
554 sgsize = NBPG - ((u_long)vaddr & PGOFSET);
555 if (buflen < sgsize)
556 sgsize = buflen;
557
558 DPRINTF(IDB_BUSDMA,
559 ("iommu_dvmamap_load: map %p loading va %p "
560 "dva %lx at pa %lx\n",
561 map, (void *)vaddr, (long)dvmaddr,
562 (long)(curaddr & ~(NBPG-1))));
563 iommu_enter(sb, trunc_page(dvmaddr), trunc_page(curaddr),
564 flags|0x4000);
565
566 dvmaddr += PAGE_SIZE;
567 vaddr += sgsize;
568 buflen -= sgsize;
569 }
570 #ifdef DIAGNOSTIC
571 for (seg = 0; seg < map->dm_nsegs; seg++) {
572 if (map->dm_segs[seg].ds_addr < is->is_dvmabase ||
573 map->dm_segs[seg].ds_addr > is->is_dvmaend) {
574 printf("seg %d dvmaddr %lx out of range %x - %x\n",
575 seg, (long)map->dm_segs[seg].ds_addr,
576 is->is_dvmabase, is->is_dvmaend);
577 Debugger();
578 }
579 }
580 #endif
581 return (0);
582 }
583
584
585 void
586 iommu_dvmamap_unload(t, sb, map)
587 bus_dma_tag_t t;
588 struct strbuf_ctl *sb;
589 bus_dmamap_t map;
590 {
591 struct iommu_state *is = sb->sb_is;
592 int error, s;
593 bus_size_t sgsize;
594
595 /* Flush the iommu */
596 #ifdef DEBUG
597 if (!map->_dm_dvmastart) {
598 printf("iommu_dvmamap_unload: No dvmastart is zero\n");
599 #ifdef DDB
600 Debugger();
601 #endif
602 }
603 #endif
604 iommu_remove(is, map->_dm_dvmastart, map->_dm_dvmasize);
605
606 /* Flush the caches */
607 bus_dmamap_unload(t->_parent, map);
608
609 /* Mark the mappings as invalid. */
610 map->dm_mapsize = 0;
611 map->dm_nsegs = 0;
612
613 s = splhigh();
614 error = extent_free(is->is_dvmamap, map->_dm_dvmastart,
615 map->_dm_dvmasize, EX_NOWAIT);
616 map->_dm_dvmastart = 0;
617 map->_dm_dvmasize = 0;
618 splx(s);
619 if (error != 0)
620 printf("warning: %qd of DVMA space lost\n", (long long)sgsize);
621
622 /* Clear the map */
623 }
624
625
626 int
627 iommu_dvmamap_load_raw(t, sb, map, segs, nsegs, flags, size)
628 bus_dma_tag_t t;
629 struct strbuf_ctl *sb;
630 bus_dmamap_t map;
631 bus_dma_segment_t *segs;
632 int nsegs;
633 int flags;
634 bus_size_t size;
635 {
636 struct iommu_state *is = sb->sb_is;
637 struct vm_page *m;
638 int i, j, s;
639 int left;
640 int err;
641 bus_size_t sgsize;
642 paddr_t pa;
643 bus_size_t boundary, align;
644 u_long dvmaddr, sgstart, sgend;
645 struct pglist *mlist;
646 int pagesz = PAGE_SIZE;
647 int npg = 0; /* DEBUG */
648
649 if (map->dm_nsegs) {
650 /* Already in use?? */
651 #ifdef DIAGNOSTIC
652 printf("iommu_dvmamap_load_raw: map still in use\n");
653 #endif
654 bus_dmamap_unload(t, map);
655 }
656
657 /*
658 * A boundary presented to bus_dmamem_alloc() takes precedence
659 * over boundary in the map.
660 */
661 if ((boundary = segs[0]._ds_boundary) == 0)
662 boundary = map->_dm_boundary;
663
664 align = max(segs[0]._ds_align, pagesz);
665
666 /*
667 * Make sure that on error condition we return "no valid mappings".
668 */
669 map->dm_nsegs = 0;
670 /* Count up the total number of pages we need */
671 pa = segs[0].ds_addr;
672 sgsize = 0;
673 left = size;
674 for (i=0; left && i<nsegs; i++) {
675 if (round_page(pa) != round_page(segs[i].ds_addr))
676 sgsize = round_page(sgsize);
677 sgsize += min(left, segs[i].ds_len);
678 left -= segs[i].ds_len;
679 pa = segs[i].ds_addr + segs[i].ds_len;
680 }
681 sgsize = round_page(sgsize);
682
683 s = splhigh();
684 /*
685 * If our segment size is larger than the boundary we need to
686 * split the transfer up into little pieces ourselves.
687 */
688 err = extent_alloc(is->is_dvmamap, sgsize, align,
689 (sgsize > boundary) ? 0 : boundary,
690 ((flags & BUS_DMA_NOWAIT) == 0 ? EX_WAITOK : EX_NOWAIT) |
691 EX_BOUNDZERO, &dvmaddr);
692 splx(s);
693
694 if (err != 0)
695 return (err);
696
697 #ifdef DEBUG
698 if (dvmaddr == (bus_addr_t)-1)
699 {
700 printf("iommu_dvmamap_load_raw(): extent_alloc(%d, %x) failed!\n",
701 (int)sgsize, flags);
702 Debugger();
703 }
704 #endif
705 if (dvmaddr == (bus_addr_t)-1)
706 return (ENOMEM);
707
708 /* Set the active DVMA map */
709 map->_dm_dvmastart = dvmaddr;
710 map->_dm_dvmasize = sgsize;
711
712 if ((mlist = segs[0]._ds_mlist) == NULL) {
713 u_long prev_va = NULL;
714 paddr_t prev_pa = 0;
715 int end = 0, offset;
716
717 /*
718 * This segs is made up of individual physical
719 * segments, probably by _bus_dmamap_load_uio() or
720 * _bus_dmamap_load_mbuf(). Ignore the mlist and
721 * load each one individually.
722 */
723 map->dm_mapsize = size;
724
725 j = 0;
726 for (i = 0; i < nsegs ; i++) {
727
728 pa = segs[i].ds_addr;
729 offset = (pa & PGOFSET);
730 pa = trunc_page(pa);
731 dvmaddr = trunc_page(dvmaddr);
732 left = min(size, segs[i].ds_len);
733
734 DPRINTF(IDB_INFO, ("iommu_dvmamap_load_raw: converting "
735 "physseg %d start %lx size %lx\n", i,
736 (long)segs[i].ds_addr, (long)segs[i].ds_len));
737
738 if ((pa == prev_pa) &&
739 ((offset != 0) || (end != offset))) {
740 /* We can re-use this mapping */
741 dvmaddr = prev_va;
742 }
743
744 sgstart = dvmaddr + offset;
745 sgend = sgstart + left - 1;
746
747 /* Are the segments virtually adjacent? */
748 if ((j > 0) && (end == offset) &&
749 ((offset == 0) || (pa == prev_pa))) {
750 /* Just append to the previous segment. */
751 map->dm_segs[--j].ds_len += left;
752 DPRINTF(IDB_INFO, ("iommu_dvmamap_load_raw: "
753 "appending seg %d start %lx size %lx\n", j,
754 (long)map->dm_segs[j].ds_addr,
755 (long)map->dm_segs[j].ds_len));
756 } else {
757 if (j >= map->_dm_segcnt) {
758 iommu_dvmamap_unload(t, sb, map);
759 return (E2BIG);
760 }
761 map->dm_segs[j].ds_addr = sgstart;
762 map->dm_segs[j].ds_len = left;
763 DPRINTF(IDB_INFO, ("iommu_dvmamap_load_raw: "
764 "seg %d start %lx size %lx\n", j,
765 (long)map->dm_segs[j].ds_addr,
766 (long)map->dm_segs[j].ds_len));
767 }
768 end = (offset + left) & PGOFSET;
769
770 /* Check for boundary issues */
771 while ((sgstart & ~(boundary - 1)) !=
772 (sgend & ~(boundary - 1))) {
773 /* Need a new segment. */
774 map->dm_segs[j].ds_len =
775 boundary - (sgstart & (boundary - 1));
776 DPRINTF(IDB_INFO, ("iommu_dvmamap_load_raw: "
777 "seg %d start %lx size %lx\n", j,
778 (long)map->dm_segs[j].ds_addr,
779 (long)map->dm_segs[j].ds_len));
780 if (++j >= map->_dm_segcnt) {
781 iommu_dvmamap_unload(t, sb, map);
782 return (E2BIG);
783 }
784 sgstart = roundup(sgstart, boundary);
785 map->dm_segs[j].ds_addr = sgstart;
786 map->dm_segs[j].ds_len = sgend - sgstart + 1;
787 }
788
789 if (sgsize == 0)
790 panic("iommu_dmamap_load_raw: size botch");
791
792 /* Now map a series of pages. */
793 while (dvmaddr <= sgend) {
794 DPRINTF(IDB_BUSDMA,
795 ("iommu_dvmamap_load_raw: map %p "
796 "loading va %lx at pa %lx\n",
797 map, (long)dvmaddr,
798 (long)(pa)));
799 /* Enter it if we haven't before. */
800 if (prev_va != dvmaddr)
801 iommu_enter(sb, prev_va = dvmaddr,
802 prev_pa = pa,
803 flags|(++npg<<12));
804 dvmaddr += pagesz;
805 pa += pagesz;
806 }
807
808 size -= left;
809 ++j;
810 }
811
812 map->dm_nsegs = j;
813 #ifdef DIAGNOSTIC
814 { int seg;
815 for (seg = 0; seg < map->dm_nsegs; seg++) {
816 if (map->dm_segs[seg].ds_addr < is->is_dvmabase ||
817 map->dm_segs[seg].ds_addr > is->is_dvmaend) {
818 printf("seg %d dvmaddr %lx out of range %x - %x\n",
819 seg, (long)map->dm_segs[seg].ds_addr,
820 is->is_dvmabase, is->is_dvmaend);
821 Debugger();
822 }
823 }
824 }
825 #endif
826 return (0);
827 }
828 /*
829 * This was allocated with bus_dmamem_alloc.
830 * The pages are on an `mlist'.
831 */
832 map->dm_mapsize = size;
833 i = 0;
834 sgstart = dvmaddr;
835 sgend = sgstart + size - 1;
836 map->dm_segs[i].ds_addr = sgstart;
837 while ((sgstart & ~(boundary - 1)) != (sgend & ~(boundary - 1))) {
838 /* Oops. We crossed a boundary. Split the xfer. */
839 map->dm_segs[i].ds_len = boundary - (sgstart & (boundary - 1));
840 DPRINTF(IDB_INFO, ("iommu_dvmamap_load_raw: "
841 "seg %d start %lx size %lx\n", i,
842 (long)map->dm_segs[i].ds_addr,
843 (long)map->dm_segs[i].ds_len));
844 if (++i >= map->_dm_segcnt) {
845 /* Too many segments. Fail the operation. */
846 s = splhigh();
847 /* How can this fail? And if it does what can we do? */
848 err = extent_free(is->is_dvmamap,
849 dvmaddr, sgsize, EX_NOWAIT);
850 map->_dm_dvmastart = 0;
851 map->_dm_dvmasize = 0;
852 splx(s);
853 return (E2BIG);
854 }
855 sgstart = roundup(sgstart, boundary);
856 map->dm_segs[i].ds_addr = sgstart;
857 }
858 DPRINTF(IDB_INFO, ("iommu_dvmamap_load_raw: "
859 "seg %d start %lx size %lx\n", i,
860 (long)map->dm_segs[i].ds_addr, (long)map->dm_segs[i].ds_len));
861 map->dm_segs[i].ds_len = sgend - sgstart + 1;
862
863 for (m = TAILQ_FIRST(mlist); m != NULL; m = TAILQ_NEXT(m,pageq)) {
864 if (sgsize == 0)
865 panic("iommu_dmamap_load_raw: size botch");
866 pa = VM_PAGE_TO_PHYS(m);
867
868 DPRINTF(IDB_BUSDMA,
869 ("iommu_dvmamap_load_raw: map %p loading va %lx at pa %lx\n",
870 map, (long)dvmaddr, (long)(pa)));
871 iommu_enter(sb, dvmaddr, pa, flags|0x8000);
872
873 dvmaddr += pagesz;
874 sgsize -= pagesz;
875 }
876 map->dm_mapsize = size;
877 map->dm_nsegs = i+1;
878 #ifdef DIAGNOSTIC
879 { int seg;
880 for (seg = 0; seg < map->dm_nsegs; seg++) {
881 if (map->dm_segs[seg].ds_addr < is->is_dvmabase ||
882 map->dm_segs[seg].ds_addr > is->is_dvmaend) {
883 printf("seg %d dvmaddr %lx out of range %x - %x\n",
884 seg, (long)map->dm_segs[seg].ds_addr,
885 is->is_dvmabase, is->is_dvmaend);
886 Debugger();
887 }
888 }
889 }
890 #endif
891 return (0);
892 }
893
894 void
895 iommu_dvmamap_sync(t, sb, map, offset, len, ops)
896 bus_dma_tag_t t;
897 struct strbuf_ctl *sb;
898 bus_dmamap_t map;
899 bus_addr_t offset;
900 bus_size_t len;
901 int ops;
902 {
903 struct iommu_state *is = sb->sb_is;
904 vaddr_t va = map->dm_segs[0].ds_addr + offset;
905 int64_t tte;
906
907 /*
908 * We only support one DMA segment; supporting more makes this code
909 * too unweildy.
910 */
911
912 if (ops & BUS_DMASYNC_PREREAD) {
913 DPRINTF(IDB_SYNC,
914 ("iommu_dvmamap_sync: syncing va %p len %lu "
915 "BUS_DMASYNC_PREREAD\n", (void *)(u_long)va, (u_long)len));
916
917 /* Nothing to do */;
918 }
919 if (ops & BUS_DMASYNC_POSTREAD) {
920 DPRINTF(IDB_SYNC,
921 ("iommu_dvmamap_sync: syncing va %p len %lu "
922 "BUS_DMASYNC_POSTREAD\n", (void *)(u_long)va, (u_long)len));
923 #ifdef DIAGNOSTIC
924 if (va < is->is_dvmabase || va >= is->is_dvmaend)
925 panic("iommu_dvmamap_sync: invalid dva %lx", va);
926 #endif
927 tte = is->is_tsb[IOTSBSLOT(va, is->is_tsbsize)];
928
929 DPRINTF(IDB_SYNC,
930 ("iommu_dvmamap_sync: syncing va %p len %lu "
931 "BUS_DMASYNC_PREWRITE\n", (void *)(u_long)va, (u_long)len));
932
933 /* if we have a streaming buffer, flush it here first */
934 if ((tte & IOTTE_STREAM) && sb->sb_flush)
935 while (len > 0) {
936 DPRINTF(IDB_BUSDMA,
937 ("iommu_dvmamap_sync: flushing va %p, %lu "
938 "bytes left\n", (void *)(u_long)va,
939 (u_long)len));
940 iommu_strbuf_flush(sb, va);
941 if (len <= NBPG) {
942 iommu_strbuf_flush_done(sb);
943 len = 0;
944 } else
945 len -= NBPG;
946 va += NBPG;
947 }
948 }
949 if (ops & BUS_DMASYNC_PREWRITE) {
950 #ifdef DIAGNOSTIC
951 if (va < is->is_dvmabase || va >= is->is_dvmaend)
952 panic("iommu_dvmamap_sync: invalid dva %lx", va);
953 #endif
954 tte = is->is_tsb[IOTSBSLOT(va, is->is_tsbsize)];
955
956 DPRINTF(IDB_SYNC,
957 ("iommu_dvmamap_sync: syncing va %p len %lu "
958 "BUS_DMASYNC_PREWRITE\n", (void *)(u_long)va, (u_long)len));
959
960 /* if we have a streaming buffer, flush it here first */
961 if ((tte & IOTTE_STREAM) && sb->sb_flush)
962 while (len > 0) {
963 DPRINTF(IDB_BUSDMA,
964 ("iommu_dvmamap_sync: flushing va %p, %lu "
965 "bytes left\n", (void *)(u_long)va,
966 (u_long)len));
967 iommu_strbuf_flush(sb, va);
968 if (len <= NBPG) {
969 iommu_strbuf_flush_done(sb);
970 len = 0;
971 } else
972 len -= NBPG;
973 va += NBPG;
974 }
975 }
976 if (ops & BUS_DMASYNC_POSTWRITE) {
977 DPRINTF(IDB_SYNC,
978 ("iommu_dvmamap_sync: syncing va %p len %lu "
979 "BUS_DMASYNC_POSTWRITE\n", (void *)(u_long)va, (u_long)len));
980 /* Nothing to do */;
981 }
982 }
983
984 int
985 iommu_dvmamem_alloc(t, sb, size, alignment, boundary, segs, nsegs, rsegs, flags)
986 bus_dma_tag_t t;
987 struct strbuf_ctl *sb;
988 bus_size_t size, alignment, boundary;
989 bus_dma_segment_t *segs;
990 int nsegs;
991 int *rsegs;
992 int flags;
993 {
994
995 DPRINTF(IDB_BUSDMA, ("iommu_dvmamem_alloc: sz %llx align %llx bound %llx "
996 "segp %p flags %d\n", (unsigned long long)size,
997 (unsigned long long)alignment, (unsigned long long)boundary,
998 segs, flags));
999 return (bus_dmamem_alloc(t->_parent, size, alignment, boundary,
1000 segs, nsegs, rsegs, flags|BUS_DMA_DVMA));
1001 }
1002
1003 void
1004 iommu_dvmamem_free(t, sb, segs, nsegs)
1005 bus_dma_tag_t t;
1006 struct strbuf_ctl *sb;
1007 bus_dma_segment_t *segs;
1008 int nsegs;
1009 {
1010
1011 DPRINTF(IDB_BUSDMA, ("iommu_dvmamem_free: segp %p nsegs %d\n",
1012 segs, nsegs));
1013 bus_dmamem_free(t->_parent, segs, nsegs);
1014 }
1015
1016 /*
1017 * Map the DVMA mappings into the kernel pmap.
1018 * Check the flags to see whether we're streaming or coherent.
1019 */
1020 int
1021 iommu_dvmamem_map(t, sb, segs, nsegs, size, kvap, flags)
1022 bus_dma_tag_t t;
1023 struct strbuf_ctl *sb;
1024 bus_dma_segment_t *segs;
1025 int nsegs;
1026 size_t size;
1027 caddr_t *kvap;
1028 int flags;
1029 {
1030 struct vm_page *m;
1031 vaddr_t va;
1032 bus_addr_t addr;
1033 struct pglist *mlist;
1034 int cbit;
1035
1036 DPRINTF(IDB_BUSDMA, ("iommu_dvmamem_map: segp %p nsegs %d size %lx\n",
1037 segs, nsegs, size));
1038
1039 /*
1040 * Allocate some space in the kernel map, and then map these pages
1041 * into this space.
1042 */
1043 size = round_page(size);
1044 va = uvm_km_valloc(kernel_map, size);
1045 if (va == 0)
1046 return (ENOMEM);
1047
1048 *kvap = (caddr_t)va;
1049
1050 /*
1051 * digest flags:
1052 */
1053 cbit = 0;
1054 if (flags & BUS_DMA_COHERENT) /* Disable vcache */
1055 cbit |= PMAP_NVC;
1056 if (flags & BUS_DMA_NOCACHE) /* sideffects */
1057 cbit |= PMAP_NC;
1058
1059 /*
1060 * Now take this and map it into the CPU.
1061 */
1062 mlist = segs[0]._ds_mlist;
1063 for (m = mlist->tqh_first; m != NULL; m = m->pageq.tqe_next) {
1064 #ifdef DIAGNOSTIC
1065 if (size == 0)
1066 panic("iommu_dvmamem_map: size botch");
1067 #endif
1068 addr = VM_PAGE_TO_PHYS(m);
1069 DPRINTF(IDB_BUSDMA, ("iommu_dvmamem_map: "
1070 "mapping va %lx at %llx\n", va, (unsigned long long)addr | cbit));
1071 pmap_enter(pmap_kernel(), va, addr | cbit,
1072 VM_PROT_READ | VM_PROT_WRITE,
1073 VM_PROT_READ | VM_PROT_WRITE | PMAP_WIRED);
1074 va += PAGE_SIZE;
1075 size -= PAGE_SIZE;
1076 }
1077 pmap_update(pmap_kernel());
1078
1079 return (0);
1080 }
1081
1082 /*
1083 * Unmap DVMA mappings from kernel
1084 */
1085 void
1086 iommu_dvmamem_unmap(t, sb, kva, size)
1087 bus_dma_tag_t t;
1088 struct strbuf_ctl *sb;
1089 caddr_t kva;
1090 size_t size;
1091 {
1092
1093 DPRINTF(IDB_BUSDMA, ("iommu_dvmamem_unmap: kvm %p size %lx\n",
1094 kva, size));
1095
1096 #ifdef DIAGNOSTIC
1097 if ((u_long)kva & PGOFSET)
1098 panic("iommu_dvmamem_unmap");
1099 #endif
1100
1101 size = round_page(size);
1102 pmap_remove(pmap_kernel(), (vaddr_t)kva, size);
1103 pmap_update(pmap_kernel());
1104 #if 0
1105 /*
1106 * XXX ? is this necessary? i think so and i think other
1107 * implementations are missing it.
1108 */
1109 uvm_km_free(kernel_map, (vaddr_t)kva, size);
1110 #endif
1111 }
1112