iommu.c revision 1.108 1 1.108 palle /* $NetBSD: iommu.c,v 1.108 2014/08/24 19:09:43 palle Exp $ */
2 1.82 mrg
3 1.82 mrg /*
4 1.82 mrg * Copyright (c) 1999, 2000 Matthew R. Green
5 1.82 mrg * All rights reserved.
6 1.82 mrg *
7 1.82 mrg * Redistribution and use in source and binary forms, with or without
8 1.82 mrg * modification, are permitted provided that the following conditions
9 1.82 mrg * are met:
10 1.82 mrg * 1. Redistributions of source code must retain the above copyright
11 1.82 mrg * notice, this list of conditions and the following disclaimer.
12 1.82 mrg * 2. Redistributions in binary form must reproduce the above copyright
13 1.82 mrg * notice, this list of conditions and the following disclaimer in the
14 1.82 mrg * documentation and/or other materials provided with the distribution.
15 1.82 mrg *
16 1.82 mrg * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
17 1.82 mrg * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
18 1.82 mrg * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
19 1.82 mrg * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
20 1.82 mrg * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
21 1.82 mrg * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
22 1.82 mrg * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
23 1.82 mrg * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
24 1.82 mrg * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
25 1.82 mrg * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
26 1.82 mrg * SUCH DAMAGE.
27 1.82 mrg */
28 1.7 mrg
29 1.7 mrg /*
30 1.48 eeh * Copyright (c) 2001, 2002 Eduardo Horvath
31 1.7 mrg * All rights reserved.
32 1.7 mrg *
33 1.7 mrg * Redistribution and use in source and binary forms, with or without
34 1.7 mrg * modification, are permitted provided that the following conditions
35 1.7 mrg * are met:
36 1.7 mrg * 1. Redistributions of source code must retain the above copyright
37 1.7 mrg * notice, this list of conditions and the following disclaimer.
38 1.7 mrg * 2. Redistributions in binary form must reproduce the above copyright
39 1.7 mrg * notice, this list of conditions and the following disclaimer in the
40 1.7 mrg * documentation and/or other materials provided with the distribution.
41 1.7 mrg * 3. The name of the author may not be used to endorse or promote products
42 1.7 mrg * derived from this software without specific prior written permission.
43 1.7 mrg *
44 1.7 mrg * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
45 1.7 mrg * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
46 1.7 mrg * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
47 1.7 mrg * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
48 1.7 mrg * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
49 1.7 mrg * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
50 1.7 mrg * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
51 1.7 mrg * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
52 1.7 mrg * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
53 1.7 mrg * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
54 1.7 mrg * SUCH DAMAGE.
55 1.7 mrg */
56 1.1 mrg
57 1.7 mrg /*
58 1.7 mrg * UltraSPARC IOMMU support; used by both the sbus and pci code.
59 1.7 mrg */
60 1.66 lukem
61 1.66 lukem #include <sys/cdefs.h>
62 1.108 palle __KERNEL_RCSID(0, "$NetBSD: iommu.c,v 1.108 2014/08/24 19:09:43 palle Exp $");
63 1.66 lukem
64 1.4 mrg #include "opt_ddb.h"
65 1.4 mrg
66 1.1 mrg #include <sys/param.h>
67 1.1 mrg #include <sys/extent.h>
68 1.1 mrg #include <sys/malloc.h>
69 1.1 mrg #include <sys/systm.h>
70 1.1 mrg #include <sys/device.h>
71 1.41 chs #include <sys/proc.h>
72 1.18 mrg
73 1.100 uebayasi #include <uvm/uvm.h>
74 1.1 mrg
75 1.104 dyoung #include <sys/bus.h>
76 1.1 mrg #include <sparc64/dev/iommureg.h>
77 1.1 mrg #include <sparc64/dev/iommuvar.h>
78 1.1 mrg
79 1.1 mrg #include <machine/autoconf.h>
80 1.1 mrg #include <machine/cpu.h>
81 1.1 mrg
82 1.1 mrg #ifdef DEBUG
83 1.22 mrg #define IDB_BUSDMA 0x1
84 1.22 mrg #define IDB_IOMMU 0x2
85 1.22 mrg #define IDB_INFO 0x4
86 1.36 eeh #define IDB_SYNC 0x8
87 1.10 mrg int iommudebug = 0x0;
88 1.4 mrg #define DPRINTF(l, s) do { if (iommudebug & l) printf s; } while (0)
89 1.90 nakayama #define IOTTE_DEBUG(n) (n)
90 1.4 mrg #else
91 1.4 mrg #define DPRINTF(l, s)
92 1.90 nakayama #define IOTTE_DEBUG(n) 0
93 1.1 mrg #endif
94 1.1 mrg
95 1.55 eeh #define iommu_strbuf_flush(i, v) do { \
96 1.55 eeh if ((i)->sb_flush) \
97 1.55 eeh bus_space_write_8((i)->sb_is->is_bustag, (i)->sb_sb, \
98 1.50 eeh STRBUFREG(strbuf_pgflush), (v)); \
99 1.42 eeh } while (0)
100 1.42 eeh
101 1.78 cdi static int iommu_strbuf_flush_done(struct strbuf_ctl *);
102 1.85 nakayama static void _iommu_dvmamap_sync(bus_dma_tag_t, bus_dmamap_t, bus_addr_t,
103 1.85 nakayama bus_size_t, int);
104 1.11 eeh
105 1.1 mrg /*
106 1.1 mrg * initialise the UltraSPARC IOMMU (SBUS or PCI):
107 1.1 mrg * - allocate and setup the iotsb.
108 1.1 mrg * - enable the IOMMU
109 1.7 mrg * - initialise the streaming buffers (if they exist)
110 1.1 mrg * - create a private DVMA map.
111 1.1 mrg */
112 1.1 mrg void
113 1.79 cdi iommu_init(char *name, struct iommu_state *is, int tsbsize, uint32_t iovabase)
114 1.1 mrg {
115 1.11 eeh psize_t size;
116 1.11 eeh vaddr_t va;
117 1.11 eeh paddr_t pa;
118 1.58 chs struct vm_page *pg;
119 1.58 chs struct pglist pglist;
120 1.1 mrg
121 1.1 mrg /*
122 1.1 mrg * Setup the iommu.
123 1.1 mrg *
124 1.45 eeh * The sun4u iommu is part of the SBUS or PCI controller so we will
125 1.45 eeh * deal with it here..
126 1.1 mrg *
127 1.45 eeh * For sysio and psycho/psycho+ the IOMMU address space always ends at
128 1.45 eeh * 0xffffe000, but the starting address depends on the size of the
129 1.45 eeh * map. The map size is 1024 * 2 ^ is->is_tsbsize entries, where each
130 1.45 eeh * entry is 8 bytes. The start of the map can be calculated by
131 1.45 eeh * (0xffffe000 << (8 + is->is_tsbsize)).
132 1.45 eeh *
133 1.45 eeh * But sabre and hummingbird use a different scheme that seems to
134 1.45 eeh * be hard-wired, so we read the start and size from the PROM and
135 1.45 eeh * just use those values.
136 1.2 eeh */
137 1.108 palle if (strncmp(name, "pyro", 4) == 0) {
138 1.108 palle is->is_cr = IOMMUREG_READ(is, iommu_cr);
139 1.108 palle is->is_cr &= ~IOMMUCR_FIRE_BE;
140 1.108 palle is->is_cr |= (IOMMUCR_FIRE_SE | IOMMUCR_FIRE_CM_EN |
141 1.108 palle IOMMUCR_FIRE_TE);
142 1.108 palle } else
143 1.108 palle is->is_cr = IOMMUCR_EN;
144 1.11 eeh is->is_tsbsize = tsbsize;
145 1.45 eeh if (iovabase == -1) {
146 1.45 eeh is->is_dvmabase = IOTSB_VSTART(is->is_tsbsize);
147 1.90 nakayama is->is_dvmaend = IOTSB_VEND - 1;
148 1.45 eeh } else {
149 1.45 eeh is->is_dvmabase = iovabase;
150 1.90 nakayama is->is_dvmaend = iovabase + IOTSB_VSIZE(tsbsize) - 1;
151 1.45 eeh }
152 1.11 eeh
153 1.11 eeh /*
154 1.15 eeh * Allocate memory for I/O pagetables. They need to be physically
155 1.15 eeh * contiguous.
156 1.11 eeh */
157 1.11 eeh
158 1.64 thorpej size = PAGE_SIZE << is->is_tsbsize;
159 1.11 eeh if (uvm_pglistalloc((psize_t)size, (paddr_t)0, (paddr_t)-1,
160 1.64 thorpej (paddr_t)PAGE_SIZE, (paddr_t)0, &pglist, 1, 0) != 0)
161 1.11 eeh panic("iommu_init: no memory");
162 1.11 eeh
163 1.76 yamt va = uvm_km_alloc(kernel_map, size, 0, UVM_KMF_VAONLY);
164 1.11 eeh if (va == 0)
165 1.11 eeh panic("iommu_init: no memory");
166 1.11 eeh is->is_tsb = (int64_t *)va;
167 1.11 eeh
168 1.58 chs is->is_ptsb = VM_PAGE_TO_PHYS(TAILQ_FIRST(&pglist));
169 1.11 eeh
170 1.11 eeh /* Map the pages */
171 1.83 ad TAILQ_FOREACH(pg, &pglist, pageq.queue) {
172 1.58 chs pa = VM_PAGE_TO_PHYS(pg);
173 1.88 cegger pmap_kenter_pa(va, pa | PMAP_NVC,
174 1.88 cegger VM_PROT_READ | VM_PROT_WRITE, 0);
175 1.64 thorpej va += PAGE_SIZE;
176 1.11 eeh }
177 1.38 chris pmap_update(pmap_kernel());
178 1.58 chs memset(is->is_tsb, 0, size);
179 1.1 mrg
180 1.1 mrg #ifdef DEBUG
181 1.102 mrg if (iommudebug & IDB_INFO)
182 1.1 mrg {
183 1.1 mrg /* Probe the iommu */
184 1.1 mrg
185 1.50 eeh printf("iommu cr=%llx tsb=%llx\n",
186 1.50 eeh (unsigned long long)bus_space_read_8(is->is_bustag,
187 1.50 eeh is->is_iommu,
188 1.103 mrg offsetof(struct iommureg, iommu_cr)),
189 1.50 eeh (unsigned long long)bus_space_read_8(is->is_bustag,
190 1.50 eeh is->is_iommu,
191 1.103 mrg offsetof(struct iommureg, iommu_tsb)));
192 1.58 chs printf("TSB base %p phys %llx\n", (void *)is->is_tsb,
193 1.50 eeh (unsigned long long)is->is_ptsb);
194 1.1 mrg delay(1000000); /* 1 s */
195 1.1 mrg }
196 1.1 mrg #endif
197 1.1 mrg
198 1.1 mrg /*
199 1.1 mrg * Now all the hardware's working we need to allocate a dvma map.
200 1.1 mrg */
201 1.98 mrg aprint_debug("DVMA map: %x to %x\n",
202 1.11 eeh (unsigned int)is->is_dvmabase,
203 1.45 eeh (unsigned int)is->is_dvmaend);
204 1.98 mrg aprint_debug("IOTSB: %llx to %llx\n",
205 1.47 eeh (unsigned long long)is->is_ptsb,
206 1.90 nakayama (unsigned long long)(is->is_ptsb + size - 1));
207 1.1 mrg is->is_dvmamap = extent_create(name,
208 1.90 nakayama is->is_dvmabase, is->is_dvmaend,
209 1.106 para 0, 0, EX_NOWAIT);
210 1.99 mrg /* XXXMRG Check is_dvmamap is valid. */
211 1.103 mrg
212 1.107 mrg mutex_init(&is->is_lock, MUTEX_DEFAULT, IPL_HIGH);
213 1.107 mrg
214 1.103 mrg /*
215 1.103 mrg * Set the TSB size. The relevant bits were moved to the TSB
216 1.103 mrg * base register in the PCIe host bridges.
217 1.103 mrg */
218 1.103 mrg if (is->is_flags & IOMMU_TSBSIZE_IN_PTSB)
219 1.103 mrg is->is_ptsb |= is->is_tsbsize;
220 1.103 mrg else
221 1.103 mrg is->is_cr |= (is->is_tsbsize << 16);
222 1.103 mrg
223 1.103 mrg /*
224 1.103 mrg * now actually start up the IOMMU
225 1.103 mrg */
226 1.103 mrg iommu_reset(is);
227 1.1 mrg }
228 1.1 mrg
229 1.8 mrg /*
230 1.8 mrg * Streaming buffers don't exist on the UltraSPARC IIi; we should have
231 1.8 mrg * detected that already and disabled them. If not, we will notice that
232 1.8 mrg * they aren't there when the STRBUF_EN bit does not remain.
233 1.8 mrg */
234 1.1 mrg void
235 1.78 cdi iommu_reset(struct iommu_state *is)
236 1.1 mrg {
237 1.45 eeh int i;
238 1.55 eeh struct strbuf_ctl *sb;
239 1.1 mrg
240 1.103 mrg IOMMUREG_WRITE(is, iommu_tsb, is->is_ptsb);
241 1.50 eeh
242 1.11 eeh /* Enable IOMMU in diagnostic mode */
243 1.103 mrg IOMMUREG_WRITE(is, iommu_cr, is->is_cr|IOMMUCR_DE);
244 1.11 eeh
245 1.58 chs for (i = 0; i < 2; i++) {
246 1.55 eeh if ((sb = is->is_sb[i])) {
247 1.5 mrg
248 1.45 eeh /* Enable diagnostics mode? */
249 1.58 chs bus_space_write_8(is->is_bustag, is->is_sb[i]->sb_sb,
250 1.50 eeh STRBUFREG(strbuf_ctl), STRBUF_EN);
251 1.45 eeh
252 1.105 nakayama membar_Lookaside();
253 1.103 mrg
254 1.45 eeh /* No streaming buffers? Disable them */
255 1.58 chs if (bus_space_read_8(is->is_bustag,
256 1.58 chs is->is_sb[i]->sb_sb,
257 1.55 eeh STRBUFREG(strbuf_ctl)) == 0) {
258 1.55 eeh is->is_sb[i]->sb_flush = NULL;
259 1.55 eeh } else {
260 1.58 chs
261 1.55 eeh /*
262 1.55 eeh * locate the pa of the flush buffer.
263 1.55 eeh */
264 1.103 mrg if (pmap_extract(pmap_kernel(),
265 1.103 mrg (vaddr_t)is->is_sb[i]->sb_flush,
266 1.103 mrg &is->is_sb[i]->sb_flushpa) == FALSE)
267 1.103 mrg is->is_sb[i]->sb_flush = NULL;
268 1.55 eeh }
269 1.45 eeh }
270 1.42 eeh }
271 1.103 mrg
272 1.103 mrg if (is->is_flags & IOMMU_FLUSH_CACHE)
273 1.103 mrg IOMMUREG_WRITE(is, iommu_cache_invalidate, -1ULL);
274 1.2 eeh }
275 1.2 eeh
276 1.2 eeh /*
277 1.58 chs * Here are the iommu control routines.
278 1.2 eeh */
279 1.2 eeh void
280 1.78 cdi iommu_enter(struct strbuf_ctl *sb, vaddr_t va, int64_t pa, int flags)
281 1.2 eeh {
282 1.55 eeh struct iommu_state *is = sb->sb_is;
283 1.55 eeh int strbuf = (flags & BUS_DMA_STREAMING);
284 1.2 eeh int64_t tte;
285 1.2 eeh
286 1.2 eeh #ifdef DIAGNOSTIC
287 1.45 eeh if (va < is->is_dvmabase || va > is->is_dvmaend)
288 1.13 mrg panic("iommu_enter: va %#lx not in DVMA space", va);
289 1.2 eeh #endif
290 1.2 eeh
291 1.55 eeh /* Is the streamcache flush really needed? */
292 1.91 nakayama if (sb->sb_flush)
293 1.55 eeh iommu_strbuf_flush(sb, va);
294 1.91 nakayama else
295 1.55 eeh /* If we can't flush the strbuf don't enable it. */
296 1.55 eeh strbuf = 0;
297 1.55 eeh
298 1.58 chs tte = MAKEIOTTE(pa, !(flags & BUS_DMA_NOWRITE),
299 1.55 eeh !(flags & BUS_DMA_NOCACHE), (strbuf));
300 1.50 eeh #ifdef DEBUG
301 1.50 eeh tte |= (flags & 0xff000LL)<<(4*8);
302 1.50 eeh #endif
303 1.58 chs
304 1.2 eeh is->is_tsb[IOTSBSLOT(va,is->is_tsbsize)] = tte;
305 1.58 chs bus_space_write_8(is->is_bustag, is->is_iommu,
306 1.50 eeh IOMMUREG(iommu_flush), va);
307 1.103 mrg DPRINTF(IDB_IOMMU, ("iommu_enter: slot %d va %lx pa %lx "
308 1.103 mrg "TSB[%lx]@%p=%lx\n", (int)IOTSBSLOT(va,is->is_tsbsize),
309 1.50 eeh va, (long)pa, (u_long)IOTSBSLOT(va,is->is_tsbsize),
310 1.50 eeh (void *)(u_long)&is->is_tsb[IOTSBSLOT(va,is->is_tsbsize)],
311 1.50 eeh (u_long)tte));
312 1.39 eeh }
313 1.39 eeh
314 1.39 eeh /*
315 1.39 eeh * Find the value of a DVMA address (debug routine).
316 1.39 eeh */
317 1.39 eeh paddr_t
318 1.78 cdi iommu_extract(struct iommu_state *is, vaddr_t dva)
319 1.39 eeh {
320 1.39 eeh int64_t tte = 0;
321 1.58 chs
322 1.90 nakayama if (dva >= is->is_dvmabase && dva <= is->is_dvmaend)
323 1.55 eeh tte = is->is_tsb[IOTSBSLOT(dva, is->is_tsbsize)];
324 1.39 eeh
325 1.54 eeh if ((tte & IOTTE_V) == 0)
326 1.39 eeh return ((paddr_t)-1L);
327 1.54 eeh return (tte & IOTTE_PAMASK);
328 1.2 eeh }
329 1.2 eeh
330 1.2 eeh /*
331 1.2 eeh * iommu_remove: removes mappings created by iommu_enter
332 1.2 eeh *
333 1.2 eeh * Only demap from IOMMU if flag is set.
334 1.8 mrg *
335 1.8 mrg * XXX: this function needs better internal error checking.
336 1.2 eeh */
337 1.2 eeh void
338 1.78 cdi iommu_remove(struct iommu_state *is, vaddr_t va, size_t len)
339 1.2 eeh {
340 1.103 mrg int slot;
341 1.2 eeh
342 1.2 eeh #ifdef DIAGNOSTIC
343 1.45 eeh if (va < is->is_dvmabase || va > is->is_dvmaend)
344 1.25 mrg panic("iommu_remove: va 0x%lx not in DVMA space", (u_long)va);
345 1.2 eeh if ((long)(va + len) < (long)va)
346 1.58 chs panic("iommu_remove: va 0x%lx + len 0x%lx wraps",
347 1.2 eeh (long) va, (long) len);
348 1.58 chs if (len & ~0xfffffff)
349 1.72 snj panic("iommu_remove: ridiculous len 0x%lx", (u_long)len);
350 1.2 eeh #endif
351 1.2 eeh
352 1.2 eeh va = trunc_page(va);
353 1.22 mrg DPRINTF(IDB_IOMMU, ("iommu_remove: va %lx TSB[%lx]@%p\n",
354 1.50 eeh va, (u_long)IOTSBSLOT(va, is->is_tsbsize),
355 1.50 eeh &is->is_tsb[IOTSBSLOT(va, is->is_tsbsize)]));
356 1.2 eeh while (len > 0) {
357 1.50 eeh DPRINTF(IDB_IOMMU, ("iommu_remove: clearing TSB slot %d "
358 1.50 eeh "for va %p size %lx\n",
359 1.50 eeh (int)IOTSBSLOT(va,is->is_tsbsize), (void *)(u_long)va,
360 1.50 eeh (u_long)len));
361 1.64 thorpej if (len <= PAGE_SIZE)
362 1.10 mrg len = 0;
363 1.10 mrg else
364 1.64 thorpej len -= PAGE_SIZE;
365 1.8 mrg
366 1.99 mrg #if 0
367 1.94 nakayama /*
368 1.94 nakayama * XXX Zero-ing the entry would not require RMW
369 1.94 nakayama *
370 1.94 nakayama * Disabling valid bit while a page is used by a device
371 1.94 nakayama * causes an uncorrectable DMA error.
372 1.94 nakayama * Workaround to avoid an uncorrectable DMA error is
373 1.94 nakayama * eliminating the next line, but the page is mapped
374 1.94 nakayama * until the next iommu_enter call.
375 1.94 nakayama */
376 1.47 eeh is->is_tsb[IOTSBSLOT(va,is->is_tsbsize)] &= ~IOTTE_V;
377 1.105 nakayama membar_StoreStore();
378 1.99 mrg #endif
379 1.103 mrg IOMMUREG_WRITE(is, iommu_flush, va);
380 1.103 mrg
381 1.103 mrg /* Flush cache if necessary. */
382 1.103 mrg slot = IOTSBSLOT(trunc_page(va), is->is_tsbsize);
383 1.103 mrg if ((is->is_flags & IOMMU_FLUSH_CACHE) &&
384 1.103 mrg (len == 0 || (slot % 8) == 7))
385 1.103 mrg IOMMUREG_WRITE(is, iommu_cache_flush,
386 1.103 mrg is->is_ptsb + slot * 8);
387 1.103 mrg
388 1.64 thorpej va += PAGE_SIZE;
389 1.2 eeh }
390 1.2 eeh }
391 1.2 eeh
392 1.58 chs static int
393 1.78 cdi iommu_strbuf_flush_done(struct strbuf_ctl *sb)
394 1.2 eeh {
395 1.55 eeh struct iommu_state *is = sb->sb_is;
396 1.2 eeh struct timeval cur, flushtimeout;
397 1.2 eeh
398 1.2 eeh #define BUMPTIME(t, usec) { \
399 1.2 eeh register volatile struct timeval *tp = (t); \
400 1.2 eeh register long us; \
401 1.2 eeh \
402 1.2 eeh tp->tv_usec = us = tp->tv_usec + (usec); \
403 1.2 eeh if (us >= 1000000) { \
404 1.2 eeh tp->tv_usec = us - 1000000; \
405 1.2 eeh tp->tv_sec++; \
406 1.2 eeh } \
407 1.2 eeh }
408 1.5 mrg
409 1.55 eeh if (!sb->sb_flush)
410 1.5 mrg return (0);
411 1.58 chs
412 1.7 mrg /*
413 1.7 mrg * Streaming buffer flushes:
414 1.58 chs *
415 1.7 mrg * 1 Tell strbuf to flush by storing va to strbuf_pgflush. If
416 1.7 mrg * we're not on a cache line boundary (64-bits):
417 1.7 mrg * 2 Store 0 in flag
418 1.7 mrg * 3 Store pointer to flag in flushsync
419 1.7 mrg * 4 wait till flushsync becomes 0x1
420 1.7 mrg *
421 1.7 mrg * If it takes more than .5 sec, something
422 1.7 mrg * went wrong.
423 1.7 mrg */
424 1.2 eeh
425 1.55 eeh *sb->sb_flush = 0;
426 1.58 chs bus_space_write_8(is->is_bustag, sb->sb_sb,
427 1.55 eeh STRBUFREG(strbuf_flushsync), sb->sb_flushpa);
428 1.2 eeh
429 1.58 chs microtime(&flushtimeout);
430 1.2 eeh cur = flushtimeout;
431 1.2 eeh BUMPTIME(&flushtimeout, 500000); /* 1/2 sec */
432 1.58 chs
433 1.103 mrg DPRINTF(IDB_IOMMU, ("%s: flush = %lx at va = %lx pa = %lx now="
434 1.103 mrg "%"PRIx64":%"PRIx32" until = %"PRIx64":%"PRIx32"\n", __func__,
435 1.58 chs (long)*sb->sb_flush, (long)sb->sb_flush, (long)sb->sb_flushpa,
436 1.42 eeh cur.tv_sec, cur.tv_usec,
437 1.42 eeh flushtimeout.tv_sec, flushtimeout.tv_usec));
438 1.42 eeh
439 1.2 eeh /* Bypass non-coherent D$ */
440 1.55 eeh while ((!ldxa(sb->sb_flushpa, ASI_PHYS_CACHED)) &&
441 1.98 mrg timercmp(&cur, &flushtimeout, <=))
442 1.2 eeh microtime(&cur);
443 1.2 eeh
444 1.2 eeh #ifdef DIAGNOSTIC
445 1.55 eeh if (!ldxa(sb->sb_flushpa, ASI_PHYS_CACHED)) {
446 1.103 mrg printf("%s: flush timeout %p, at %p\n", __func__,
447 1.55 eeh (void *)(u_long)*sb->sb_flush,
448 1.55 eeh (void *)(u_long)sb->sb_flushpa); /* panic? */
449 1.2 eeh #ifdef DDB
450 1.2 eeh Debugger();
451 1.2 eeh #endif
452 1.2 eeh }
453 1.2 eeh #endif
454 1.103 mrg DPRINTF(IDB_IOMMU, ("%s: flushed\n", __func__));
455 1.55 eeh return (*sb->sb_flush);
456 1.7 mrg }
457 1.7 mrg
458 1.7 mrg /*
459 1.7 mrg * IOMMU DVMA operations, common to SBUS and PCI.
460 1.7 mrg */
461 1.7 mrg int
462 1.85 nakayama iommu_dvmamap_load(bus_dma_tag_t t, bus_dmamap_t map, void *buf,
463 1.85 nakayama bus_size_t buflen, struct proc *p, int flags)
464 1.7 mrg {
465 1.85 nakayama struct strbuf_ctl *sb = (struct strbuf_ctl *)map->_dm_cookie;
466 1.55 eeh struct iommu_state *is = sb->sb_is;
467 1.91 nakayama int err, needsflush;
468 1.7 mrg bus_size_t sgsize;
469 1.7 mrg paddr_t curaddr;
470 1.90 nakayama u_long dvmaddr, sgstart, sgend, bmask;
471 1.71 tsutsui bus_size_t align, boundary, len;
472 1.7 mrg vaddr_t vaddr = (vaddr_t)buf;
473 1.40 eeh int seg;
474 1.58 chs struct pmap *pmap;
475 1.103 mrg int slot;
476 1.7 mrg
477 1.7 mrg if (map->dm_nsegs) {
478 1.7 mrg /* Already in use?? */
479 1.7 mrg #ifdef DIAGNOSTIC
480 1.7 mrg printf("iommu_dvmamap_load: map still in use\n");
481 1.7 mrg #endif
482 1.7 mrg bus_dmamap_unload(t, map);
483 1.7 mrg }
484 1.58 chs
485 1.7 mrg /*
486 1.7 mrg * Make sure that on error condition we return "no valid mappings".
487 1.7 mrg */
488 1.7 mrg map->dm_nsegs = 0;
489 1.96 nakayama KASSERT(map->dm_maxsegsz <= map->_dm_maxmaxsegsz);
490 1.96 nakayama
491 1.7 mrg if (buflen > map->_dm_size) {
492 1.22 mrg DPRINTF(IDB_BUSDMA,
493 1.7 mrg ("iommu_dvmamap_load(): error %d > %d -- "
494 1.25 mrg "map size exceeded!\n", (int)buflen, (int)map->_dm_size));
495 1.7 mrg return (EINVAL);
496 1.7 mrg }
497 1.7 mrg
498 1.7 mrg sgsize = round_page(buflen + ((int)vaddr & PGOFSET));
499 1.20 mrg
500 1.7 mrg /*
501 1.21 eeh * A boundary presented to bus_dmamem_alloc() takes precedence
502 1.21 eeh * over boundary in the map.
503 1.7 mrg */
504 1.21 eeh if ((boundary = (map->dm_segs[0]._ds_boundary)) == 0)
505 1.21 eeh boundary = map->_dm_boundary;
506 1.64 thorpej align = max(map->dm_segs[0]._ds_align, PAGE_SIZE);
507 1.58 chs
508 1.58 chs /*
509 1.58 chs * If our segment size is larger than the boundary we need to
510 1.40 eeh * split the transfer up int little pieces ourselves.
511 1.40 eeh */
512 1.103 mrg KASSERT(is->is_dvmamap);
513 1.107 mrg mutex_enter(&is->is_lock);
514 1.58 chs err = extent_alloc(is->is_dvmamap, sgsize, align,
515 1.71 tsutsui (sgsize > boundary) ? 0 : boundary,
516 1.71 tsutsui EX_NOWAIT|EX_BOUNDZERO, &dvmaddr);
517 1.107 mrg mutex_exit(&is->is_lock);
518 1.7 mrg
519 1.7 mrg #ifdef DEBUG
520 1.71 tsutsui if (err || (dvmaddr == (u_long)-1)) {
521 1.7 mrg printf("iommu_dvmamap_load(): extent_alloc(%d, %x) failed!\n",
522 1.25 mrg (int)sgsize, flags);
523 1.40 eeh #ifdef DDB
524 1.7 mrg Debugger();
525 1.40 eeh #endif
526 1.58 chs }
527 1.58 chs #endif
528 1.11 eeh if (err != 0)
529 1.11 eeh return (err);
530 1.11 eeh
531 1.65 nakayama if (dvmaddr == (u_long)-1)
532 1.7 mrg return (ENOMEM);
533 1.7 mrg
534 1.40 eeh /* Set the active DVMA map */
535 1.40 eeh map->_dm_dvmastart = dvmaddr;
536 1.40 eeh map->_dm_dvmasize = sgsize;
537 1.40 eeh
538 1.40 eeh /*
539 1.40 eeh * Now split the DVMA range into segments, not crossing
540 1.40 eeh * the boundary.
541 1.40 eeh */
542 1.40 eeh seg = 0;
543 1.40 eeh sgstart = dvmaddr + (vaddr & PGOFSET);
544 1.40 eeh sgend = sgstart + buflen - 1;
545 1.40 eeh map->dm_segs[seg].ds_addr = sgstart;
546 1.71 tsutsui DPRINTF(IDB_INFO, ("iommu_dvmamap_load: boundary %lx boundary - 1 %lx "
547 1.71 tsutsui "~(boundary - 1) %lx\n", (long)boundary, (long)(boundary - 1),
548 1.71 tsutsui (long)~(boundary - 1)));
549 1.90 nakayama bmask = ~(boundary - 1);
550 1.96 nakayama while ((sgstart & bmask) != (sgend & bmask) ||
551 1.96 nakayama sgend - sgstart + 1 > map->dm_maxsegsz) {
552 1.96 nakayama /* Oops. We crossed a boundary or large seg. Split the xfer. */
553 1.96 nakayama len = map->dm_maxsegsz;
554 1.96 nakayama if ((sgstart & bmask) != (sgend & bmask))
555 1.96 nakayama len = min(len, boundary - (sgstart & (boundary - 1)));
556 1.71 tsutsui map->dm_segs[seg].ds_len = len;
557 1.40 eeh DPRINTF(IDB_INFO, ("iommu_dvmamap_load: "
558 1.71 tsutsui "seg %d start %lx size %lx\n", seg,
559 1.71 tsutsui (long)map->dm_segs[seg].ds_addr,
560 1.71 tsutsui (long)map->dm_segs[seg].ds_len));
561 1.53 eeh if (++seg >= map->_dm_segcnt) {
562 1.40 eeh /* Too many segments. Fail the operation. */
563 1.40 eeh DPRINTF(IDB_INFO, ("iommu_dvmamap_load: "
564 1.71 tsutsui "too many segments %d\n", seg));
565 1.107 mrg mutex_enter(&is->is_lock);
566 1.40 eeh err = extent_free(is->is_dvmamap,
567 1.71 tsutsui dvmaddr, sgsize, EX_NOWAIT);
568 1.40 eeh map->_dm_dvmastart = 0;
569 1.40 eeh map->_dm_dvmasize = 0;
570 1.107 mrg mutex_exit(&is->is_lock);
571 1.95 nakayama if (err != 0)
572 1.95 nakayama printf("warning: %s: %" PRId64
573 1.95 nakayama " of DVMA space lost\n", __func__, sgsize);
574 1.80 mrg return (EFBIG);
575 1.40 eeh }
576 1.71 tsutsui sgstart += len;
577 1.40 eeh map->dm_segs[seg].ds_addr = sgstart;
578 1.40 eeh }
579 1.40 eeh map->dm_segs[seg].ds_len = sgend - sgstart + 1;
580 1.40 eeh DPRINTF(IDB_INFO, ("iommu_dvmamap_load: "
581 1.71 tsutsui "seg %d start %lx size %lx\n", seg,
582 1.71 tsutsui (long)map->dm_segs[seg].ds_addr, (long)map->dm_segs[seg].ds_len));
583 1.71 tsutsui map->dm_nsegs = seg + 1;
584 1.7 mrg map->dm_mapsize = buflen;
585 1.7 mrg
586 1.7 mrg if (p != NULL)
587 1.7 mrg pmap = p->p_vmspace->vm_map.pmap;
588 1.7 mrg else
589 1.7 mrg pmap = pmap_kernel();
590 1.7 mrg
591 1.91 nakayama needsflush = 0;
592 1.7 mrg for (; buflen > 0; ) {
593 1.58 chs
594 1.7 mrg /*
595 1.7 mrg * Get the physical address for this page.
596 1.7 mrg */
597 1.7 mrg if (pmap_extract(pmap, (vaddr_t)vaddr, &curaddr) == FALSE) {
598 1.74 petrov #ifdef DIAGNOSTIC
599 1.74 petrov printf("iommu_dvmamap_load: pmap_extract failed %lx\n", vaddr);
600 1.74 petrov #endif
601 1.7 mrg bus_dmamap_unload(t, map);
602 1.7 mrg return (-1);
603 1.7 mrg }
604 1.7 mrg
605 1.7 mrg /*
606 1.7 mrg * Compute the segment size, and adjust counts.
607 1.7 mrg */
608 1.64 thorpej sgsize = PAGE_SIZE - ((u_long)vaddr & PGOFSET);
609 1.7 mrg if (buflen < sgsize)
610 1.7 mrg sgsize = buflen;
611 1.7 mrg
612 1.22 mrg DPRINTF(IDB_BUSDMA,
613 1.36 eeh ("iommu_dvmamap_load: map %p loading va %p "
614 1.71 tsutsui "dva %lx at pa %lx\n",
615 1.71 tsutsui map, (void *)vaddr, (long)dvmaddr,
616 1.87 nakayama (long)trunc_page(curaddr)));
617 1.55 eeh iommu_enter(sb, trunc_page(dvmaddr), trunc_page(curaddr),
618 1.90 nakayama flags | IOTTE_DEBUG(0x4000));
619 1.91 nakayama needsflush = 1;
620 1.58 chs
621 1.7 mrg vaddr += sgsize;
622 1.7 mrg buflen -= sgsize;
623 1.103 mrg
624 1.103 mrg /* Flush cache if necessary. */
625 1.103 mrg slot = IOTSBSLOT(trunc_page(dvmaddr), is->is_tsbsize);
626 1.103 mrg if ((is->is_flags & IOMMU_FLUSH_CACHE) &&
627 1.103 mrg (buflen <= 0 || (slot % 8) == 7))
628 1.103 mrg IOMMUREG_WRITE(is, iommu_cache_flush,
629 1.103 mrg is->is_ptsb + slot * 8);
630 1.103 mrg
631 1.103 mrg dvmaddr += PAGE_SIZE;
632 1.7 mrg }
633 1.91 nakayama if (needsflush)
634 1.91 nakayama iommu_strbuf_flush_done(sb);
635 1.45 eeh #ifdef DIAGNOSTIC
636 1.45 eeh for (seg = 0; seg < map->dm_nsegs; seg++) {
637 1.45 eeh if (map->dm_segs[seg].ds_addr < is->is_dvmabase ||
638 1.45 eeh map->dm_segs[seg].ds_addr > is->is_dvmaend) {
639 1.45 eeh printf("seg %d dvmaddr %lx out of range %x - %x\n",
640 1.71 tsutsui seg, (long)map->dm_segs[seg].ds_addr,
641 1.71 tsutsui is->is_dvmabase, is->is_dvmaend);
642 1.57 chs #ifdef DDB
643 1.45 eeh Debugger();
644 1.57 chs #endif
645 1.45 eeh }
646 1.45 eeh }
647 1.45 eeh #endif
648 1.7 mrg return (0);
649 1.7 mrg }
650 1.7 mrg
651 1.7 mrg
652 1.7 mrg void
653 1.85 nakayama iommu_dvmamap_unload(bus_dma_tag_t t, bus_dmamap_t map)
654 1.7 mrg {
655 1.85 nakayama struct strbuf_ctl *sb = (struct strbuf_ctl *)map->_dm_cookie;
656 1.55 eeh struct iommu_state *is = sb->sb_is;
657 1.107 mrg int error;
658 1.70 christos bus_size_t sgsize = map->_dm_dvmasize;
659 1.7 mrg
660 1.40 eeh /* Flush the iommu */
661 1.40 eeh #ifdef DEBUG
662 1.40 eeh if (!map->_dm_dvmastart) {
663 1.40 eeh printf("iommu_dvmamap_unload: No dvmastart is zero\n");
664 1.40 eeh #ifdef DDB
665 1.40 eeh Debugger();
666 1.40 eeh #endif
667 1.40 eeh }
668 1.40 eeh #endif
669 1.40 eeh iommu_remove(is, map->_dm_dvmastart, map->_dm_dvmasize);
670 1.7 mrg
671 1.23 eeh /* Flush the caches */
672 1.23 eeh bus_dmamap_unload(t->_parent, map);
673 1.23 eeh
674 1.107 mrg mutex_enter(&is->is_lock);
675 1.58 chs error = extent_free(is->is_dvmamap, map->_dm_dvmastart,
676 1.40 eeh map->_dm_dvmasize, EX_NOWAIT);
677 1.43 eeh map->_dm_dvmastart = 0;
678 1.43 eeh map->_dm_dvmasize = 0;
679 1.107 mrg mutex_exit(&is->is_lock);
680 1.7 mrg if (error != 0)
681 1.95 nakayama printf("warning: %s: %" PRId64 " of DVMA space lost\n",
682 1.95 nakayama __func__, sgsize);
683 1.40 eeh
684 1.40 eeh /* Clear the map */
685 1.9 eeh }
686 1.9 eeh
687 1.9 eeh
688 1.9 eeh int
689 1.85 nakayama iommu_dvmamap_load_raw(bus_dma_tag_t t, bus_dmamap_t map,
690 1.85 nakayama bus_dma_segment_t *segs, int nsegs, bus_size_t size, int flags)
691 1.9 eeh {
692 1.85 nakayama struct strbuf_ctl *sb = (struct strbuf_ctl *)map->_dm_cookie;
693 1.55 eeh struct iommu_state *is = sb->sb_is;
694 1.58 chs struct vm_page *pg;
695 1.107 mrg int i, j;
696 1.26 martin int left;
697 1.91 nakayama int err, needsflush;
698 1.9 eeh bus_size_t sgsize;
699 1.9 eeh paddr_t pa;
700 1.21 eeh bus_size_t boundary, align;
701 1.90 nakayama u_long dvmaddr, sgstart, sgend, bmask;
702 1.58 chs struct pglist *pglist;
703 1.90 nakayama const int pagesz = PAGE_SIZE;
704 1.103 mrg int slot;
705 1.90 nakayama #ifdef DEBUG
706 1.90 nakayama int npg = 0;
707 1.90 nakayama #endif
708 1.9 eeh
709 1.9 eeh if (map->dm_nsegs) {
710 1.9 eeh /* Already in use?? */
711 1.9 eeh #ifdef DIAGNOSTIC
712 1.9 eeh printf("iommu_dvmamap_load_raw: map still in use\n");
713 1.9 eeh #endif
714 1.9 eeh bus_dmamap_unload(t, map);
715 1.9 eeh }
716 1.40 eeh
717 1.40 eeh /*
718 1.40 eeh * A boundary presented to bus_dmamem_alloc() takes precedence
719 1.40 eeh * over boundary in the map.
720 1.40 eeh */
721 1.40 eeh if ((boundary = segs[0]._ds_boundary) == 0)
722 1.40 eeh boundary = map->_dm_boundary;
723 1.40 eeh
724 1.45 eeh align = max(segs[0]._ds_align, pagesz);
725 1.40 eeh
726 1.9 eeh /*
727 1.9 eeh * Make sure that on error condition we return "no valid mappings".
728 1.9 eeh */
729 1.9 eeh map->dm_nsegs = 0;
730 1.26 martin /* Count up the total number of pages we need */
731 1.93 nakayama pa = trunc_page(segs[0].ds_addr);
732 1.26 martin sgsize = 0;
733 1.40 eeh left = size;
734 1.93 nakayama for (i = 0; left > 0 && i < nsegs; i++) {
735 1.26 martin if (round_page(pa) != round_page(segs[i].ds_addr))
736 1.93 nakayama sgsize = round_page(sgsize) +
737 1.93 nakayama (segs[i].ds_addr & PGOFSET);
738 1.40 eeh sgsize += min(left, segs[i].ds_len);
739 1.40 eeh left -= segs[i].ds_len;
740 1.26 martin pa = segs[i].ds_addr + segs[i].ds_len;
741 1.26 martin }
742 1.93 nakayama sgsize = round_page(sgsize);
743 1.9 eeh
744 1.107 mrg mutex_enter(&is->is_lock);
745 1.58 chs /*
746 1.58 chs * If our segment size is larger than the boundary we need to
747 1.45 eeh * split the transfer up into little pieces ourselves.
748 1.9 eeh */
749 1.40 eeh err = extent_alloc(is->is_dvmamap, sgsize, align,
750 1.40 eeh (sgsize > boundary) ? 0 : boundary,
751 1.40 eeh ((flags & BUS_DMA_NOWAIT) == 0 ? EX_WAITOK : EX_NOWAIT) |
752 1.54 eeh EX_BOUNDZERO, &dvmaddr);
753 1.107 mrg mutex_exit(&is->is_lock);
754 1.9 eeh
755 1.9 eeh if (err != 0)
756 1.9 eeh return (err);
757 1.9 eeh
758 1.9 eeh #ifdef DEBUG
759 1.65 nakayama if (dvmaddr == (u_long)-1)
760 1.58 chs {
761 1.9 eeh printf("iommu_dvmamap_load_raw(): extent_alloc(%d, %x) failed!\n",
762 1.25 mrg (int)sgsize, flags);
763 1.57 chs #ifdef DDB
764 1.9 eeh Debugger();
765 1.57 chs #endif
766 1.58 chs }
767 1.58 chs #endif
768 1.65 nakayama if (dvmaddr == (u_long)-1)
769 1.9 eeh return (ENOMEM);
770 1.9 eeh
771 1.40 eeh /* Set the active DVMA map */
772 1.40 eeh map->_dm_dvmastart = dvmaddr;
773 1.40 eeh map->_dm_dvmasize = sgsize;
774 1.40 eeh
775 1.90 nakayama bmask = ~(boundary - 1);
776 1.58 chs if ((pglist = segs[0]._ds_mlist) == NULL) {
777 1.92 nakayama u_long prev_va = 0UL, last_va = dvmaddr;
778 1.45 eeh paddr_t prev_pa = 0;
779 1.45 eeh int end = 0, offset;
780 1.92 nakayama bus_size_t len = size;
781 1.45 eeh
782 1.26 martin /*
783 1.45 eeh * This segs is made up of individual physical
784 1.58 chs * segments, probably by _bus_dmamap_load_uio() or
785 1.26 martin * _bus_dmamap_load_mbuf(). Ignore the mlist and
786 1.45 eeh * load each one individually.
787 1.26 martin */
788 1.45 eeh j = 0;
789 1.91 nakayama needsflush = 0;
790 1.45 eeh for (i = 0; i < nsegs ; i++) {
791 1.40 eeh
792 1.45 eeh pa = segs[i].ds_addr;
793 1.45 eeh offset = (pa & PGOFSET);
794 1.45 eeh pa = trunc_page(pa);
795 1.45 eeh dvmaddr = trunc_page(dvmaddr);
796 1.92 nakayama left = min(len, segs[i].ds_len);
797 1.45 eeh
798 1.45 eeh DPRINTF(IDB_INFO, ("iommu_dvmamap_load_raw: converting "
799 1.58 chs "physseg %d start %lx size %lx\n", i,
800 1.61 martin (long)segs[i].ds_addr, (long)segs[i].ds_len));
801 1.26 martin
802 1.58 chs if ((pa == prev_pa) &&
803 1.47 eeh ((offset != 0) || (end != offset))) {
804 1.45 eeh /* We can re-use this mapping */
805 1.45 eeh dvmaddr = prev_va;
806 1.45 eeh }
807 1.29 martin
808 1.45 eeh sgstart = dvmaddr + offset;
809 1.45 eeh sgend = sgstart + left - 1;
810 1.26 martin
811 1.45 eeh /* Are the segments virtually adjacent? */
812 1.58 chs if ((j > 0) && (end == offset) &&
813 1.96 nakayama ((offset == 0) || (pa == prev_pa)) &&
814 1.96 nakayama (map->dm_segs[j-1].ds_len + left <=
815 1.96 nakayama map->dm_maxsegsz)) {
816 1.45 eeh /* Just append to the previous segment. */
817 1.45 eeh map->dm_segs[--j].ds_len += left;
818 1.93 nakayama /* Restore sgstart for boundary check */
819 1.93 nakayama sgstart = map->dm_segs[j].ds_addr;
820 1.45 eeh DPRINTF(IDB_INFO, ("iommu_dvmamap_load_raw: "
821 1.45 eeh "appending seg %d start %lx size %lx\n", j,
822 1.58 chs (long)map->dm_segs[j].ds_addr,
823 1.61 martin (long)map->dm_segs[j].ds_len));
824 1.45 eeh } else {
825 1.53 eeh if (j >= map->_dm_segcnt) {
826 1.92 nakayama iommu_remove(is, map->_dm_dvmastart,
827 1.92 nakayama last_va - map->_dm_dvmastart);
828 1.92 nakayama goto fail;
829 1.53 eeh }
830 1.45 eeh map->dm_segs[j].ds_addr = sgstart;
831 1.45 eeh map->dm_segs[j].ds_len = left;
832 1.45 eeh DPRINTF(IDB_INFO, ("iommu_dvmamap_load_raw: "
833 1.45 eeh "seg %d start %lx size %lx\n", j,
834 1.48 eeh (long)map->dm_segs[j].ds_addr,
835 1.61 martin (long)map->dm_segs[j].ds_len));
836 1.40 eeh }
837 1.45 eeh end = (offset + left) & PGOFSET;
838 1.40 eeh
839 1.40 eeh /* Check for boundary issues */
840 1.90 nakayama while ((sgstart & bmask) != (sgend & bmask)) {
841 1.40 eeh /* Need a new segment. */
842 1.40 eeh map->dm_segs[j].ds_len =
843 1.53 eeh boundary - (sgstart & (boundary - 1));
844 1.40 eeh DPRINTF(IDB_INFO, ("iommu_dvmamap_load_raw: "
845 1.40 eeh "seg %d start %lx size %lx\n", j,
846 1.58 chs (long)map->dm_segs[j].ds_addr,
847 1.61 martin (long)map->dm_segs[j].ds_len));
848 1.53 eeh if (++j >= map->_dm_segcnt) {
849 1.92 nakayama iommu_remove(is, map->_dm_dvmastart,
850 1.92 nakayama last_va - map->_dm_dvmastart);
851 1.92 nakayama goto fail;
852 1.40 eeh }
853 1.93 nakayama sgstart += map->dm_segs[j-1].ds_len;
854 1.40 eeh map->dm_segs[j].ds_addr = sgstart;
855 1.40 eeh map->dm_segs[j].ds_len = sgend - sgstart + 1;
856 1.40 eeh }
857 1.40 eeh
858 1.26 martin if (sgsize == 0)
859 1.26 martin panic("iommu_dmamap_load_raw: size botch");
860 1.40 eeh
861 1.45 eeh /* Now map a series of pages. */
862 1.51 eeh while (dvmaddr <= sgend) {
863 1.45 eeh DPRINTF(IDB_BUSDMA,
864 1.45 eeh ("iommu_dvmamap_load_raw: map %p "
865 1.45 eeh "loading va %lx at pa %lx\n",
866 1.45 eeh map, (long)dvmaddr,
867 1.45 eeh (long)(pa)));
868 1.45 eeh /* Enter it if we haven't before. */
869 1.91 nakayama if (prev_va != dvmaddr) {
870 1.55 eeh iommu_enter(sb, prev_va = dvmaddr,
871 1.90 nakayama prev_pa = pa,
872 1.90 nakayama flags | IOTTE_DEBUG(++npg << 12));
873 1.91 nakayama needsflush = 1;
874 1.103 mrg
875 1.103 mrg /* Flush cache if necessary. */
876 1.103 mrg slot = IOTSBSLOT(trunc_page(dvmaddr), is->is_tsbsize);
877 1.103 mrg if ((is->is_flags & IOMMU_FLUSH_CACHE) &&
878 1.103 mrg ((dvmaddr + pagesz) > sgend || (slot % 8) == 7))
879 1.103 mrg IOMMUREG_WRITE(is, iommu_cache_flush,
880 1.103 mrg is->is_ptsb + slot * 8);
881 1.91 nakayama }
882 1.103 mrg
883 1.45 eeh dvmaddr += pagesz;
884 1.45 eeh pa += pagesz;
885 1.92 nakayama last_va = dvmaddr;
886 1.45 eeh }
887 1.45 eeh
888 1.92 nakayama len -= left;
889 1.45 eeh ++j;
890 1.26 martin }
891 1.91 nakayama if (needsflush)
892 1.91 nakayama iommu_strbuf_flush_done(sb);
893 1.45 eeh
894 1.92 nakayama map->dm_mapsize = size;
895 1.45 eeh map->dm_nsegs = j;
896 1.45 eeh #ifdef DIAGNOSTIC
897 1.45 eeh { int seg;
898 1.45 eeh for (seg = 0; seg < map->dm_nsegs; seg++) {
899 1.45 eeh if (map->dm_segs[seg].ds_addr < is->is_dvmabase ||
900 1.103 mrg map->dm_segs[seg].ds_addr > is->is_dvmaend) {
901 1.45 eeh printf("seg %d dvmaddr %lx out of range %x - %x\n",
902 1.58 chs seg, (long)map->dm_segs[seg].ds_addr,
903 1.45 eeh is->is_dvmabase, is->is_dvmaend);
904 1.57 chs #ifdef DDB
905 1.45 eeh Debugger();
906 1.57 chs #endif
907 1.45 eeh }
908 1.45 eeh }
909 1.45 eeh }
910 1.45 eeh #endif
911 1.26 martin return (0);
912 1.26 martin }
913 1.58 chs
914 1.9 eeh /*
915 1.40 eeh * This was allocated with bus_dmamem_alloc.
916 1.58 chs * The pages are on a `pglist'.
917 1.9 eeh */
918 1.26 martin i = 0;
919 1.40 eeh sgstart = dvmaddr;
920 1.40 eeh sgend = sgstart + size - 1;
921 1.40 eeh map->dm_segs[i].ds_addr = sgstart;
922 1.90 nakayama while ((sgstart & bmask) != (sgend & bmask)) {
923 1.40 eeh /* Oops. We crossed a boundary. Split the xfer. */
924 1.53 eeh map->dm_segs[i].ds_len = boundary - (sgstart & (boundary - 1));
925 1.40 eeh DPRINTF(IDB_INFO, ("iommu_dvmamap_load_raw: "
926 1.40 eeh "seg %d start %lx size %lx\n", i,
927 1.48 eeh (long)map->dm_segs[i].ds_addr,
928 1.61 martin (long)map->dm_segs[i].ds_len));
929 1.53 eeh if (++i >= map->_dm_segcnt) {
930 1.40 eeh /* Too many segments. Fail the operation. */
931 1.92 nakayama goto fail;
932 1.40 eeh }
933 1.93 nakayama sgstart += map->dm_segs[i-1].ds_len;
934 1.40 eeh map->dm_segs[i].ds_addr = sgstart;
935 1.40 eeh }
936 1.40 eeh DPRINTF(IDB_INFO, ("iommu_dvmamap_load_raw: "
937 1.40 eeh "seg %d start %lx size %lx\n", i,
938 1.61 martin (long)map->dm_segs[i].ds_addr, (long)map->dm_segs[i].ds_len));
939 1.40 eeh map->dm_segs[i].ds_len = sgend - sgstart + 1;
940 1.9 eeh
941 1.91 nakayama needsflush = 0;
942 1.83 ad TAILQ_FOREACH(pg, pglist, pageq.queue) {
943 1.9 eeh if (sgsize == 0)
944 1.9 eeh panic("iommu_dmamap_load_raw: size botch");
945 1.58 chs pa = VM_PAGE_TO_PHYS(pg);
946 1.9 eeh
947 1.22 mrg DPRINTF(IDB_BUSDMA,
948 1.9 eeh ("iommu_dvmamap_load_raw: map %p loading va %lx at pa %lx\n",
949 1.9 eeh map, (long)dvmaddr, (long)(pa)));
950 1.90 nakayama iommu_enter(sb, dvmaddr, pa, flags | IOTTE_DEBUG(0x8000));
951 1.91 nakayama needsflush = 1;
952 1.58 chs
953 1.103 mrg sgsize -= pagesz;
954 1.103 mrg
955 1.103 mrg /* Flush cache if necessary. */
956 1.103 mrg slot = IOTSBSLOT(trunc_page(dvmaddr), is->is_tsbsize);
957 1.103 mrg if ((is->is_flags & IOMMU_FLUSH_CACHE) &&
958 1.103 mrg (sgsize == 0 || (slot % 8) == 7))
959 1.103 mrg IOMMUREG_WRITE(is, iommu_cache_flush,
960 1.103 mrg is->is_ptsb + slot * 8);
961 1.103 mrg
962 1.102 mrg dvmaddr += pagesz;
963 1.9 eeh }
964 1.91 nakayama if (needsflush)
965 1.91 nakayama iommu_strbuf_flush_done(sb);
966 1.40 eeh map->dm_mapsize = size;
967 1.40 eeh map->dm_nsegs = i+1;
968 1.45 eeh #ifdef DIAGNOSTIC
969 1.45 eeh { int seg;
970 1.45 eeh for (seg = 0; seg < map->dm_nsegs; seg++) {
971 1.45 eeh if (map->dm_segs[seg].ds_addr < is->is_dvmabase ||
972 1.45 eeh map->dm_segs[seg].ds_addr > is->is_dvmaend) {
973 1.45 eeh printf("seg %d dvmaddr %lx out of range %x - %x\n",
974 1.58 chs seg, (long)map->dm_segs[seg].ds_addr,
975 1.45 eeh is->is_dvmabase, is->is_dvmaend);
976 1.57 chs #ifdef DDB
977 1.45 eeh Debugger();
978 1.57 chs #endif
979 1.45 eeh }
980 1.45 eeh }
981 1.45 eeh }
982 1.45 eeh #endif
983 1.9 eeh return (0);
984 1.92 nakayama
985 1.92 nakayama fail:
986 1.107 mrg mutex_enter(&is->is_lock);
987 1.92 nakayama err = extent_free(is->is_dvmamap, map->_dm_dvmastart, sgsize,
988 1.92 nakayama EX_NOWAIT);
989 1.92 nakayama map->_dm_dvmastart = 0;
990 1.92 nakayama map->_dm_dvmasize = 0;
991 1.107 mrg mutex_exit(&is->is_lock);
992 1.95 nakayama if (err != 0)
993 1.95 nakayama printf("warning: %s: %" PRId64 " of DVMA space lost\n",
994 1.95 nakayama __func__, sgsize);
995 1.92 nakayama return (EFBIG);
996 1.7 mrg }
997 1.7 mrg
998 1.67 petrov
999 1.67 petrov /*
1000 1.67 petrov * Flush an individual dma segment, returns non-zero if the streaming buffers
1001 1.67 petrov * need flushing afterwards.
1002 1.67 petrov */
1003 1.67 petrov static int
1004 1.67 petrov iommu_dvmamap_sync_range(struct strbuf_ctl *sb, vaddr_t va, bus_size_t len)
1005 1.67 petrov {
1006 1.67 petrov vaddr_t vaend;
1007 1.67 petrov struct iommu_state *is = sb->sb_is;
1008 1.67 petrov
1009 1.67 petrov #ifdef DIAGNOSTIC
1010 1.67 petrov if (va < is->is_dvmabase || va > is->is_dvmaend)
1011 1.67 petrov panic("invalid va: %llx", (long long)va);
1012 1.67 petrov #endif
1013 1.67 petrov
1014 1.67 petrov if ((is->is_tsb[IOTSBSLOT(va, is->is_tsbsize)] & IOTTE_STREAM) == 0) {
1015 1.103 mrg DPRINTF(IDB_SYNC,
1016 1.67 petrov ("iommu_dvmamap_sync_range: attempting to flush "
1017 1.67 petrov "non-streaming entry\n"));
1018 1.67 petrov return (0);
1019 1.67 petrov }
1020 1.67 petrov
1021 1.90 nakayama vaend = round_page(va + len) - 1;
1022 1.87 nakayama va = trunc_page(va);
1023 1.67 petrov
1024 1.67 petrov #ifdef DIAGNOSTIC
1025 1.67 petrov if (va < is->is_dvmabase || vaend > is->is_dvmaend)
1026 1.67 petrov panic("invalid va range: %llx to %llx (%x to %x)",
1027 1.67 petrov (long long)va, (long long)vaend,
1028 1.67 petrov is->is_dvmabase,
1029 1.67 petrov is->is_dvmaend);
1030 1.67 petrov #endif
1031 1.67 petrov
1032 1.67 petrov for ( ; va <= vaend; va += PAGE_SIZE) {
1033 1.103 mrg DPRINTF(IDB_SYNC,
1034 1.67 petrov ("iommu_dvmamap_sync_range: flushing va %p\n",
1035 1.67 petrov (void *)(u_long)va));
1036 1.67 petrov iommu_strbuf_flush(sb, va);
1037 1.67 petrov }
1038 1.67 petrov
1039 1.67 petrov return (1);
1040 1.67 petrov }
1041 1.67 petrov
1042 1.85 nakayama static void
1043 1.85 nakayama _iommu_dvmamap_sync(bus_dma_tag_t t, bus_dmamap_t map, bus_addr_t offset,
1044 1.85 nakayama bus_size_t len, int ops)
1045 1.7 mrg {
1046 1.85 nakayama struct strbuf_ctl *sb = (struct strbuf_ctl *)map->_dm_cookie;
1047 1.67 petrov bus_size_t count;
1048 1.67 petrov int i, needsflush = 0;
1049 1.63 petrov
1050 1.63 petrov if (!sb->sb_flush)
1051 1.63 petrov return;
1052 1.7 mrg
1053 1.67 petrov for (i = 0; i < map->dm_nsegs; i++) {
1054 1.67 petrov if (offset < map->dm_segs[i].ds_len)
1055 1.67 petrov break;
1056 1.67 petrov offset -= map->dm_segs[i].ds_len;
1057 1.67 petrov }
1058 1.60 petrov
1059 1.67 petrov if (i == map->dm_nsegs)
1060 1.103 mrg panic("%s: segment too short %llu", __func__,
1061 1.68 martin (unsigned long long)offset);
1062 1.60 petrov
1063 1.62 petrov if (ops & (BUS_DMASYNC_PREREAD | BUS_DMASYNC_POSTWRITE)) {
1064 1.60 petrov /* Nothing to do */;
1065 1.60 petrov }
1066 1.60 petrov
1067 1.62 petrov if (ops & (BUS_DMASYNC_POSTREAD | BUS_DMASYNC_PREWRITE)) {
1068 1.67 petrov
1069 1.67 petrov for (; len > 0 && i < map->dm_nsegs; i++) {
1070 1.67 petrov count = MIN(map->dm_segs[i].ds_len - offset, len);
1071 1.67 petrov if (count > 0 &&
1072 1.67 petrov iommu_dvmamap_sync_range(sb,
1073 1.67 petrov map->dm_segs[i].ds_addr + offset, count))
1074 1.67 petrov needsflush = 1;
1075 1.67 petrov offset = 0;
1076 1.67 petrov len -= count;
1077 1.67 petrov }
1078 1.60 petrov #ifdef DIAGNOSTIC
1079 1.67 petrov if (i == map->dm_nsegs && len > 0)
1080 1.103 mrg panic("%s: leftover %llu", __func__,
1081 1.73 nakayama (unsigned long long)len);
1082 1.60 petrov #endif
1083 1.55 eeh
1084 1.67 petrov if (needsflush)
1085 1.58 chs iommu_strbuf_flush_done(sb);
1086 1.7 mrg }
1087 1.7 mrg }
1088 1.7 mrg
1089 1.85 nakayama void
1090 1.85 nakayama iommu_dvmamap_sync(bus_dma_tag_t t, bus_dmamap_t map, bus_addr_t offset,
1091 1.85 nakayama bus_size_t len, int ops)
1092 1.85 nakayama {
1093 1.85 nakayama
1094 1.89 jdc /* If len is 0, then there is nothing to do */
1095 1.89 jdc if (len == 0)
1096 1.89 jdc return;
1097 1.89 jdc
1098 1.85 nakayama if (ops & (BUS_DMASYNC_PREREAD | BUS_DMASYNC_PREWRITE)) {
1099 1.85 nakayama /* Flush the CPU then the IOMMU */
1100 1.85 nakayama bus_dmamap_sync(t->_parent, map, offset, len, ops);
1101 1.85 nakayama _iommu_dvmamap_sync(t, map, offset, len, ops);
1102 1.85 nakayama }
1103 1.85 nakayama if (ops & (BUS_DMASYNC_POSTREAD | BUS_DMASYNC_POSTWRITE)) {
1104 1.85 nakayama /* Flush the IOMMU then the CPU */
1105 1.85 nakayama _iommu_dvmamap_sync(t, map, offset, len, ops);
1106 1.85 nakayama bus_dmamap_sync(t->_parent, map, offset, len, ops);
1107 1.85 nakayama }
1108 1.85 nakayama }
1109 1.85 nakayama
1110 1.7 mrg int
1111 1.85 nakayama iommu_dvmamem_alloc(bus_dma_tag_t t, bus_size_t size, bus_size_t alignment,
1112 1.85 nakayama bus_size_t boundary, bus_dma_segment_t *segs, int nsegs, int *rsegs,
1113 1.85 nakayama int flags)
1114 1.7 mrg {
1115 1.7 mrg
1116 1.25 mrg DPRINTF(IDB_BUSDMA, ("iommu_dvmamem_alloc: sz %llx align %llx bound %llx "
1117 1.25 mrg "segp %p flags %d\n", (unsigned long long)size,
1118 1.25 mrg (unsigned long long)alignment, (unsigned long long)boundary,
1119 1.25 mrg segs, flags));
1120 1.7 mrg return (bus_dmamem_alloc(t->_parent, size, alignment, boundary,
1121 1.21 eeh segs, nsegs, rsegs, flags|BUS_DMA_DVMA));
1122 1.7 mrg }
1123 1.7 mrg
1124 1.7 mrg void
1125 1.85 nakayama iommu_dvmamem_free(bus_dma_tag_t t, bus_dma_segment_t *segs, int nsegs)
1126 1.7 mrg {
1127 1.7 mrg
1128 1.22 mrg DPRINTF(IDB_BUSDMA, ("iommu_dvmamem_free: segp %p nsegs %d\n",
1129 1.7 mrg segs, nsegs));
1130 1.7 mrg bus_dmamem_free(t->_parent, segs, nsegs);
1131 1.7 mrg }
1132 1.7 mrg
1133 1.7 mrg /*
1134 1.7 mrg * Map the DVMA mappings into the kernel pmap.
1135 1.7 mrg * Check the flags to see whether we're streaming or coherent.
1136 1.7 mrg */
1137 1.7 mrg int
1138 1.85 nakayama iommu_dvmamem_map(bus_dma_tag_t t, bus_dma_segment_t *segs, int nsegs,
1139 1.85 nakayama size_t size, void **kvap, int flags)
1140 1.7 mrg {
1141 1.58 chs struct vm_page *pg;
1142 1.7 mrg vaddr_t va;
1143 1.7 mrg bus_addr_t addr;
1144 1.58 chs struct pglist *pglist;
1145 1.8 mrg int cbit;
1146 1.77 yamt const uvm_flag_t kmflags =
1147 1.77 yamt (flags & BUS_DMA_NOWAIT) != 0 ? UVM_KMF_NOWAIT : 0;
1148 1.7 mrg
1149 1.22 mrg DPRINTF(IDB_BUSDMA, ("iommu_dvmamem_map: segp %p nsegs %d size %lx\n",
1150 1.7 mrg segs, nsegs, size));
1151 1.7 mrg
1152 1.7 mrg /*
1153 1.8 mrg * Allocate some space in the kernel map, and then map these pages
1154 1.8 mrg * into this space.
1155 1.7 mrg */
1156 1.8 mrg size = round_page(size);
1157 1.77 yamt va = uvm_km_alloc(kernel_map, size, 0, UVM_KMF_VAONLY | kmflags);
1158 1.8 mrg if (va == 0)
1159 1.8 mrg return (ENOMEM);
1160 1.7 mrg
1161 1.81 christos *kvap = (void *)va;
1162 1.7 mrg
1163 1.58 chs /*
1164 1.7 mrg * digest flags:
1165 1.7 mrg */
1166 1.7 mrg cbit = 0;
1167 1.7 mrg if (flags & BUS_DMA_COHERENT) /* Disable vcache */
1168 1.7 mrg cbit |= PMAP_NVC;
1169 1.97 skrll if (flags & BUS_DMA_NOCACHE) /* side effects */
1170 1.7 mrg cbit |= PMAP_NC;
1171 1.7 mrg
1172 1.7 mrg /*
1173 1.8 mrg * Now take this and map it into the CPU.
1174 1.7 mrg */
1175 1.58 chs pglist = segs[0]._ds_mlist;
1176 1.83 ad TAILQ_FOREACH(pg, pglist, pageq.queue) {
1177 1.8 mrg #ifdef DIAGNOSTIC
1178 1.7 mrg if (size == 0)
1179 1.7 mrg panic("iommu_dvmamem_map: size botch");
1180 1.8 mrg #endif
1181 1.58 chs addr = VM_PAGE_TO_PHYS(pg);
1182 1.22 mrg DPRINTF(IDB_BUSDMA, ("iommu_dvmamem_map: "
1183 1.25 mrg "mapping va %lx at %llx\n", va, (unsigned long long)addr | cbit));
1184 1.88 cegger pmap_kenter_pa(va, addr | cbit,
1185 1.88 cegger VM_PROT_READ | VM_PROT_WRITE, 0);
1186 1.7 mrg va += PAGE_SIZE;
1187 1.7 mrg size -= PAGE_SIZE;
1188 1.7 mrg }
1189 1.38 chris pmap_update(pmap_kernel());
1190 1.7 mrg return (0);
1191 1.7 mrg }
1192 1.7 mrg
1193 1.7 mrg /*
1194 1.7 mrg * Unmap DVMA mappings from kernel
1195 1.7 mrg */
1196 1.7 mrg void
1197 1.85 nakayama iommu_dvmamem_unmap(bus_dma_tag_t t, void *kva, size_t size)
1198 1.7 mrg {
1199 1.58 chs
1200 1.22 mrg DPRINTF(IDB_BUSDMA, ("iommu_dvmamem_unmap: kvm %p size %lx\n",
1201 1.7 mrg kva, size));
1202 1.58 chs
1203 1.7 mrg #ifdef DIAGNOSTIC
1204 1.7 mrg if ((u_long)kva & PGOFSET)
1205 1.7 mrg panic("iommu_dvmamem_unmap");
1206 1.7 mrg #endif
1207 1.58 chs
1208 1.7 mrg size = round_page(size);
1209 1.58 chs pmap_kremove((vaddr_t)kva, size);
1210 1.38 chris pmap_update(pmap_kernel());
1211 1.76 yamt uvm_km_free(kernel_map, (vaddr_t)kva, size, UVM_KMF_VAONLY);
1212 1.1 mrg }
1213