Home | History | Annotate | Line # | Download | only in dev
iommu.c revision 1.107.2.1
      1  1.107.2.1  jdolecek /*	$NetBSD: iommu.c,v 1.107.2.1 2017/12/03 11:36:44 jdolecek Exp $	*/
      2       1.82       mrg 
      3       1.82       mrg /*
      4       1.82       mrg  * Copyright (c) 1999, 2000 Matthew R. Green
      5       1.82       mrg  * All rights reserved.
      6       1.82       mrg  *
      7       1.82       mrg  * Redistribution and use in source and binary forms, with or without
      8       1.82       mrg  * modification, are permitted provided that the following conditions
      9       1.82       mrg  * are met:
     10       1.82       mrg  * 1. Redistributions of source code must retain the above copyright
     11       1.82       mrg  *    notice, this list of conditions and the following disclaimer.
     12       1.82       mrg  * 2. Redistributions in binary form must reproduce the above copyright
     13       1.82       mrg  *    notice, this list of conditions and the following disclaimer in the
     14       1.82       mrg  *    documentation and/or other materials provided with the distribution.
     15       1.82       mrg  *
     16       1.82       mrg  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
     17       1.82       mrg  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
     18       1.82       mrg  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
     19       1.82       mrg  * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
     20       1.82       mrg  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
     21       1.82       mrg  * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
     22       1.82       mrg  * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
     23       1.82       mrg  * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
     24       1.82       mrg  * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     25       1.82       mrg  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     26       1.82       mrg  * SUCH DAMAGE.
     27       1.82       mrg  */
     28        1.7       mrg 
     29        1.7       mrg /*
     30       1.48       eeh  * Copyright (c) 2001, 2002 Eduardo Horvath
     31        1.7       mrg  * All rights reserved.
     32        1.7       mrg  *
     33        1.7       mrg  * Redistribution and use in source and binary forms, with or without
     34        1.7       mrg  * modification, are permitted provided that the following conditions
     35        1.7       mrg  * are met:
     36        1.7       mrg  * 1. Redistributions of source code must retain the above copyright
     37        1.7       mrg  *    notice, this list of conditions and the following disclaimer.
     38        1.7       mrg  * 2. Redistributions in binary form must reproduce the above copyright
     39        1.7       mrg  *    notice, this list of conditions and the following disclaimer in the
     40        1.7       mrg  *    documentation and/or other materials provided with the distribution.
     41        1.7       mrg  * 3. The name of the author may not be used to endorse or promote products
     42        1.7       mrg  *    derived from this software without specific prior written permission.
     43        1.7       mrg  *
     44        1.7       mrg  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
     45        1.7       mrg  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
     46        1.7       mrg  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
     47        1.7       mrg  * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
     48        1.7       mrg  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
     49        1.7       mrg  * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
     50        1.7       mrg  * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
     51        1.7       mrg  * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
     52        1.7       mrg  * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     53        1.7       mrg  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     54        1.7       mrg  * SUCH DAMAGE.
     55        1.7       mrg  */
     56        1.1       mrg 
     57        1.7       mrg /*
     58        1.7       mrg  * UltraSPARC IOMMU support; used by both the sbus and pci code.
     59        1.7       mrg  */
     60       1.66     lukem 
     61       1.66     lukem #include <sys/cdefs.h>
     62  1.107.2.1  jdolecek __KERNEL_RCSID(0, "$NetBSD: iommu.c,v 1.107.2.1 2017/12/03 11:36:44 jdolecek Exp $");
     63       1.66     lukem 
     64        1.4       mrg #include "opt_ddb.h"
     65        1.4       mrg 
     66        1.1       mrg #include <sys/param.h>
     67        1.1       mrg #include <sys/extent.h>
     68        1.1       mrg #include <sys/malloc.h>
     69        1.1       mrg #include <sys/systm.h>
     70        1.1       mrg #include <sys/device.h>
     71       1.41       chs #include <sys/proc.h>
     72       1.18       mrg 
     73      1.100  uebayasi #include <uvm/uvm.h>
     74        1.1       mrg 
     75      1.104    dyoung #include <sys/bus.h>
     76        1.1       mrg #include <sparc64/dev/iommureg.h>
     77        1.1       mrg #include <sparc64/dev/iommuvar.h>
     78        1.1       mrg 
     79        1.1       mrg #include <machine/autoconf.h>
     80        1.1       mrg #include <machine/cpu.h>
     81  1.107.2.1  jdolecek #include <machine/hypervisor.h>
     82        1.1       mrg 
     83        1.1       mrg #ifdef DEBUG
     84       1.22       mrg #define IDB_BUSDMA	0x1
     85       1.22       mrg #define IDB_IOMMU	0x2
     86       1.22       mrg #define IDB_INFO	0x4
     87       1.36       eeh #define	IDB_SYNC	0x8
     88       1.10       mrg int iommudebug = 0x0;
     89        1.4       mrg #define DPRINTF(l, s)   do { if (iommudebug & l) printf s; } while (0)
     90       1.90  nakayama #define IOTTE_DEBUG(n)	(n)
     91        1.4       mrg #else
     92        1.4       mrg #define DPRINTF(l, s)
     93       1.90  nakayama #define IOTTE_DEBUG(n)	0
     94        1.1       mrg #endif
     95        1.1       mrg 
     96       1.55       eeh #define iommu_strbuf_flush(i, v) do {					\
     97       1.55       eeh 	if ((i)->sb_flush)						\
     98       1.55       eeh 		bus_space_write_8((i)->sb_is->is_bustag, (i)->sb_sb,	\
     99       1.50       eeh 			STRBUFREG(strbuf_pgflush), (v));		\
    100       1.42       eeh 	} while (0)
    101       1.42       eeh 
    102       1.78       cdi static	int iommu_strbuf_flush_done(struct strbuf_ctl *);
    103       1.85  nakayama static	void _iommu_dvmamap_sync(bus_dma_tag_t, bus_dmamap_t, bus_addr_t,
    104       1.85  nakayama 		bus_size_t, int);
    105  1.107.2.1  jdolecek static void iommu_enter_sun4u(struct strbuf_ctl *sb, vaddr_t va, int64_t pa, int flags);
    106  1.107.2.1  jdolecek static void iommu_enter_sun4v(struct strbuf_ctl *sb, vaddr_t va, int64_t pa, int flags);
    107  1.107.2.1  jdolecek static void iommu_remove_sun4u(struct iommu_state *is, vaddr_t va, size_t len);
    108  1.107.2.1  jdolecek static void iommu_remove_sun4v(struct iommu_state *is, vaddr_t va, size_t len);
    109       1.11       eeh 
    110        1.1       mrg /*
    111        1.1       mrg  * initialise the UltraSPARC IOMMU (SBUS or PCI):
    112        1.1       mrg  *	- allocate and setup the iotsb.
    113        1.1       mrg  *	- enable the IOMMU
    114        1.7       mrg  *	- initialise the streaming buffers (if they exist)
    115        1.1       mrg  *	- create a private DVMA map.
    116        1.1       mrg  */
    117        1.1       mrg void
    118       1.79       cdi iommu_init(char *name, struct iommu_state *is, int tsbsize, uint32_t iovabase)
    119        1.1       mrg {
    120       1.11       eeh 	psize_t size;
    121       1.11       eeh 	vaddr_t va;
    122       1.11       eeh 	paddr_t pa;
    123       1.58       chs 	struct vm_page *pg;
    124       1.58       chs 	struct pglist pglist;
    125        1.1       mrg 
    126  1.107.2.1  jdolecek 	DPRINTF(IDB_INFO, ("iommu_init: tsbsize %x iovabase %x\n", tsbsize, iovabase));
    127  1.107.2.1  jdolecek 
    128        1.1       mrg 	/*
    129        1.1       mrg 	 * Setup the iommu.
    130        1.1       mrg 	 *
    131       1.45       eeh 	 * The sun4u iommu is part of the SBUS or PCI controller so we will
    132       1.45       eeh 	 * deal with it here..
    133        1.1       mrg 	 *
    134       1.45       eeh 	 * For sysio and psycho/psycho+ the IOMMU address space always ends at
    135       1.45       eeh 	 * 0xffffe000, but the starting address depends on the size of the
    136       1.45       eeh 	 * map.  The map size is 1024 * 2 ^ is->is_tsbsize entries, where each
    137       1.45       eeh 	 * entry is 8 bytes.  The start of the map can be calculated by
    138       1.45       eeh 	 * (0xffffe000 << (8 + is->is_tsbsize)).
    139       1.45       eeh 	 *
    140       1.45       eeh 	 * But sabre and hummingbird use a different scheme that seems to
    141       1.45       eeh 	 * be hard-wired, so we read the start and size from the PROM and
    142       1.45       eeh 	 * just use those values.
    143        1.2       eeh 	 */
    144  1.107.2.1  jdolecek 	if (strncmp(name, "pyro", 4) == 0) {
    145  1.107.2.1  jdolecek 		is->is_cr = IOMMUREG_READ(is, iommu_cr);
    146  1.107.2.1  jdolecek 		is->is_cr &= ~IOMMUCR_FIRE_BE;
    147  1.107.2.1  jdolecek 		is->is_cr |= (IOMMUCR_FIRE_SE | IOMMUCR_FIRE_CM_EN |
    148  1.107.2.1  jdolecek 		    IOMMUCR_FIRE_TE);
    149  1.107.2.1  jdolecek 	} else
    150  1.107.2.1  jdolecek 		is->is_cr = IOMMUCR_EN;
    151       1.11       eeh 	is->is_tsbsize = tsbsize;
    152       1.45       eeh 	if (iovabase == -1) {
    153       1.45       eeh 		is->is_dvmabase = IOTSB_VSTART(is->is_tsbsize);
    154       1.90  nakayama 		is->is_dvmaend = IOTSB_VEND - 1;
    155       1.45       eeh 	} else {
    156       1.45       eeh 		is->is_dvmabase = iovabase;
    157       1.90  nakayama 		is->is_dvmaend = iovabase + IOTSB_VSIZE(tsbsize) - 1;
    158       1.45       eeh 	}
    159       1.11       eeh 
    160       1.11       eeh 	/*
    161       1.15       eeh 	 * Allocate memory for I/O pagetables.  They need to be physically
    162       1.15       eeh 	 * contiguous.
    163       1.11       eeh 	 */
    164       1.11       eeh 
    165       1.64   thorpej 	size = PAGE_SIZE << is->is_tsbsize;
    166       1.11       eeh 	if (uvm_pglistalloc((psize_t)size, (paddr_t)0, (paddr_t)-1,
    167       1.64   thorpej 		(paddr_t)PAGE_SIZE, (paddr_t)0, &pglist, 1, 0) != 0)
    168       1.11       eeh 		panic("iommu_init: no memory");
    169       1.11       eeh 
    170       1.76      yamt 	va = uvm_km_alloc(kernel_map, size, 0, UVM_KMF_VAONLY);
    171       1.11       eeh 	if (va == 0)
    172       1.11       eeh 		panic("iommu_init: no memory");
    173       1.11       eeh 	is->is_tsb = (int64_t *)va;
    174       1.11       eeh 
    175       1.58       chs 	is->is_ptsb = VM_PAGE_TO_PHYS(TAILQ_FIRST(&pglist));
    176       1.11       eeh 
    177       1.11       eeh 	/* Map the pages */
    178       1.83        ad 	TAILQ_FOREACH(pg, &pglist, pageq.queue) {
    179       1.58       chs 		pa = VM_PAGE_TO_PHYS(pg);
    180       1.88    cegger 		pmap_kenter_pa(va, pa | PMAP_NVC,
    181       1.88    cegger 		    VM_PROT_READ | VM_PROT_WRITE, 0);
    182       1.64   thorpej 		va += PAGE_SIZE;
    183       1.11       eeh 	}
    184       1.38     chris 	pmap_update(pmap_kernel());
    185       1.58       chs 	memset(is->is_tsb, 0, size);
    186        1.1       mrg 
    187        1.1       mrg #ifdef DEBUG
    188      1.102       mrg 	if (iommudebug & IDB_INFO)
    189        1.1       mrg 	{
    190        1.1       mrg 		/* Probe the iommu */
    191  1.107.2.1  jdolecek 		if (!CPU_ISSUN4V) {
    192  1.107.2.1  jdolecek 			printf("iommu cr=%llx tsb=%llx\n",
    193  1.107.2.1  jdolecek 			    (unsigned long long)bus_space_read_8(is->is_bustag,
    194       1.50       eeh 				is->is_iommu,
    195      1.103       mrg 				offsetof(struct iommureg, iommu_cr)),
    196  1.107.2.1  jdolecek 			    (unsigned long long)bus_space_read_8(is->is_bustag,
    197       1.50       eeh 				is->is_iommu,
    198      1.103       mrg 				offsetof(struct iommureg, iommu_tsb)));
    199  1.107.2.1  jdolecek 			printf("TSB base %p phys %llx\n", (void *)is->is_tsb,
    200  1.107.2.1  jdolecek 			    (unsigned long long)is->is_ptsb);
    201  1.107.2.1  jdolecek 			delay(1000000); /* 1 s */
    202  1.107.2.1  jdolecek 		}
    203        1.1       mrg 	}
    204        1.1       mrg #endif
    205        1.1       mrg 
    206        1.1       mrg 	/*
    207        1.1       mrg 	 * Now all the hardware's working we need to allocate a dvma map.
    208        1.1       mrg 	 */
    209       1.98       mrg 	aprint_debug("DVMA map: %x to %x\n",
    210       1.11       eeh 		(unsigned int)is->is_dvmabase,
    211       1.45       eeh 		(unsigned int)is->is_dvmaend);
    212       1.98       mrg 	aprint_debug("IOTSB: %llx to %llx\n",
    213       1.47       eeh 		(unsigned long long)is->is_ptsb,
    214       1.90  nakayama 		(unsigned long long)(is->is_ptsb + size - 1));
    215        1.1       mrg 	is->is_dvmamap = extent_create(name,
    216       1.90  nakayama 	    is->is_dvmabase, is->is_dvmaend,
    217      1.106      para 	    0, 0, EX_NOWAIT);
    218  1.107.2.1  jdolecek 	if (!is->is_dvmamap)
    219  1.107.2.1  jdolecek 		panic("iommu_init: extent_create() failed");
    220  1.107.2.1  jdolecek 
    221      1.107       mrg 	mutex_init(&is->is_lock, MUTEX_DEFAULT, IPL_HIGH);
    222      1.107       mrg 
    223      1.103       mrg 	/*
    224      1.103       mrg 	 * Set the TSB size.  The relevant bits were moved to the TSB
    225      1.103       mrg 	 * base register in the PCIe host bridges.
    226      1.103       mrg 	 */
    227      1.103       mrg 	if (is->is_flags & IOMMU_TSBSIZE_IN_PTSB)
    228      1.103       mrg 		is->is_ptsb |= is->is_tsbsize;
    229      1.103       mrg 	else
    230      1.103       mrg 		is->is_cr |= (is->is_tsbsize << 16);
    231      1.103       mrg 
    232      1.103       mrg 	/*
    233      1.103       mrg 	 * now actually start up the IOMMU
    234      1.103       mrg 	 */
    235      1.103       mrg 	iommu_reset(is);
    236        1.1       mrg }
    237        1.1       mrg 
    238        1.8       mrg /*
    239        1.8       mrg  * Streaming buffers don't exist on the UltraSPARC IIi; we should have
    240        1.8       mrg  * detected that already and disabled them.  If not, we will notice that
    241        1.8       mrg  * they aren't there when the STRBUF_EN bit does not remain.
    242        1.8       mrg  */
    243        1.1       mrg void
    244       1.78       cdi iommu_reset(struct iommu_state *is)
    245        1.1       mrg {
    246       1.45       eeh 	int i;
    247       1.55       eeh 	struct strbuf_ctl *sb;
    248        1.1       mrg 
    249  1.107.2.1  jdolecek 	if (CPU_ISSUN4V)
    250  1.107.2.1  jdolecek 		return;
    251  1.107.2.1  jdolecek 
    252      1.103       mrg 	IOMMUREG_WRITE(is, iommu_tsb, is->is_ptsb);
    253       1.50       eeh 
    254       1.11       eeh 	/* Enable IOMMU in diagnostic mode */
    255      1.103       mrg 	IOMMUREG_WRITE(is, iommu_cr, is->is_cr|IOMMUCR_DE);
    256       1.11       eeh 
    257       1.58       chs 	for (i = 0; i < 2; i++) {
    258       1.55       eeh 		if ((sb = is->is_sb[i])) {
    259        1.5       mrg 
    260       1.45       eeh 			/* Enable diagnostics mode? */
    261       1.58       chs 			bus_space_write_8(is->is_bustag, is->is_sb[i]->sb_sb,
    262       1.50       eeh 				STRBUFREG(strbuf_ctl), STRBUF_EN);
    263       1.45       eeh 
    264      1.105  nakayama 			membar_Lookaside();
    265      1.103       mrg 
    266       1.45       eeh 			/* No streaming buffers? Disable them */
    267       1.58       chs 			if (bus_space_read_8(is->is_bustag,
    268       1.58       chs 				is->is_sb[i]->sb_sb,
    269       1.55       eeh 				STRBUFREG(strbuf_ctl)) == 0) {
    270       1.55       eeh 				is->is_sb[i]->sb_flush = NULL;
    271       1.55       eeh 			} else {
    272       1.58       chs 
    273       1.55       eeh 				/*
    274       1.55       eeh 				 * locate the pa of the flush buffer.
    275       1.55       eeh 				 */
    276      1.103       mrg 				if (pmap_extract(pmap_kernel(),
    277      1.103       mrg 				     (vaddr_t)is->is_sb[i]->sb_flush,
    278      1.103       mrg 				     &is->is_sb[i]->sb_flushpa) == FALSE)
    279      1.103       mrg 					is->is_sb[i]->sb_flush = NULL;
    280       1.55       eeh 			}
    281       1.45       eeh 		}
    282       1.42       eeh 	}
    283      1.103       mrg 
    284      1.103       mrg 	if (is->is_flags & IOMMU_FLUSH_CACHE)
    285      1.103       mrg 		IOMMUREG_WRITE(is, iommu_cache_invalidate, -1ULL);
    286        1.2       eeh }
    287        1.2       eeh 
    288        1.2       eeh /*
    289       1.58       chs  * Here are the iommu control routines.
    290        1.2       eeh  */
    291  1.107.2.1  jdolecek 
    292        1.2       eeh void
    293       1.78       cdi iommu_enter(struct strbuf_ctl *sb, vaddr_t va, int64_t pa, int flags)
    294        1.2       eeh {
    295  1.107.2.1  jdolecek 	DPRINTF(IDB_IOMMU, ("iommu_enter: va %lx pa %lx flags %x\n",
    296  1.107.2.1  jdolecek 	    va, (long)pa, flags));
    297  1.107.2.1  jdolecek 	if (!CPU_ISSUN4V)
    298  1.107.2.1  jdolecek 		iommu_enter_sun4u(sb, va, pa, flags);
    299  1.107.2.1  jdolecek 	else
    300  1.107.2.1  jdolecek 		iommu_enter_sun4v(sb, va, pa, flags);
    301  1.107.2.1  jdolecek }
    302  1.107.2.1  jdolecek 
    303  1.107.2.1  jdolecek 
    304  1.107.2.1  jdolecek void
    305  1.107.2.1  jdolecek iommu_enter_sun4u(struct strbuf_ctl *sb, vaddr_t va, int64_t pa, int flags)
    306  1.107.2.1  jdolecek {
    307       1.55       eeh 	struct iommu_state *is = sb->sb_is;
    308       1.55       eeh 	int strbuf = (flags & BUS_DMA_STREAMING);
    309        1.2       eeh 	int64_t tte;
    310        1.2       eeh 
    311        1.2       eeh #ifdef DIAGNOSTIC
    312       1.45       eeh 	if (va < is->is_dvmabase || va > is->is_dvmaend)
    313       1.13       mrg 		panic("iommu_enter: va %#lx not in DVMA space", va);
    314        1.2       eeh #endif
    315        1.2       eeh 
    316       1.55       eeh 	/* Is the streamcache flush really needed? */
    317       1.91  nakayama 	if (sb->sb_flush)
    318       1.55       eeh 		iommu_strbuf_flush(sb, va);
    319       1.91  nakayama 	else
    320       1.55       eeh 		/* If we can't flush the strbuf don't enable it. */
    321       1.55       eeh 		strbuf = 0;
    322       1.55       eeh 
    323       1.58       chs 	tte = MAKEIOTTE(pa, !(flags & BUS_DMA_NOWRITE),
    324       1.55       eeh 		!(flags & BUS_DMA_NOCACHE), (strbuf));
    325       1.50       eeh #ifdef DEBUG
    326       1.50       eeh 	tte |= (flags & 0xff000LL)<<(4*8);
    327       1.50       eeh #endif
    328       1.58       chs 
    329        1.2       eeh 	is->is_tsb[IOTSBSLOT(va,is->is_tsbsize)] = tte;
    330       1.58       chs 	bus_space_write_8(is->is_bustag, is->is_iommu,
    331       1.50       eeh 		IOMMUREG(iommu_flush), va);
    332      1.103       mrg 	DPRINTF(IDB_IOMMU, ("iommu_enter: slot %d va %lx pa %lx "
    333      1.103       mrg 		"TSB[%lx]@%p=%lx\n", (int)IOTSBSLOT(va,is->is_tsbsize),
    334       1.50       eeh 		va, (long)pa, (u_long)IOTSBSLOT(va,is->is_tsbsize),
    335       1.50       eeh 		(void *)(u_long)&is->is_tsb[IOTSBSLOT(va,is->is_tsbsize)],
    336       1.50       eeh 		(u_long)tte));
    337       1.39       eeh }
    338       1.39       eeh 
    339  1.107.2.1  jdolecek void
    340  1.107.2.1  jdolecek iommu_enter_sun4v(struct strbuf_ctl *sb, vaddr_t va, int64_t pa, int flags)
    341  1.107.2.1  jdolecek {
    342  1.107.2.1  jdolecek 	struct iommu_state *is = sb->sb_is;
    343  1.107.2.1  jdolecek 	u_int64_t tsbid = IOTSBSLOT(va, is->is_tsbsize);
    344  1.107.2.1  jdolecek 	paddr_t page_list[1], addr;
    345  1.107.2.1  jdolecek 	u_int64_t attr, nmapped;
    346  1.107.2.1  jdolecek 	int err;
    347  1.107.2.1  jdolecek 
    348  1.107.2.1  jdolecek #ifdef DIAGNOSTIC
    349  1.107.2.1  jdolecek 	if (va < is->is_dvmabase || (va + PAGE_MASK) > is->is_dvmaend)
    350  1.107.2.1  jdolecek 		panic("viommu_enter: va %#lx not in DVMA space", va);
    351  1.107.2.1  jdolecek #endif
    352  1.107.2.1  jdolecek 
    353  1.107.2.1  jdolecek 	attr = PCI_MAP_ATTR_READ | PCI_MAP_ATTR_WRITE;
    354  1.107.2.1  jdolecek 	if (flags & BUS_DMA_READ)
    355  1.107.2.1  jdolecek 		attr &= ~PCI_MAP_ATTR_READ;
    356  1.107.2.1  jdolecek 	if (flags & BUS_DMA_WRITE)
    357  1.107.2.1  jdolecek 		attr &= ~PCI_MAP_ATTR_WRITE;
    358  1.107.2.1  jdolecek 
    359  1.107.2.1  jdolecek 	page_list[0] = trunc_page(pa);
    360  1.107.2.1  jdolecek 	if (!pmap_extract(pmap_kernel(), (vaddr_t)page_list, &addr))
    361  1.107.2.1  jdolecek 		panic("viommu_enter: pmap_extract failed");
    362  1.107.2.1  jdolecek 	err = hv_pci_iommu_map(is->is_devhandle, tsbid, 1, attr,
    363  1.107.2.1  jdolecek 	    addr, &nmapped);
    364  1.107.2.1  jdolecek 	if (err != H_EOK || nmapped != 1)
    365  1.107.2.1  jdolecek 		panic("hv_pci_iommu_map: err=%d, nmapped=%lu", err, (long unsigned int)nmapped);
    366  1.107.2.1  jdolecek }
    367  1.107.2.1  jdolecek 
    368       1.39       eeh /*
    369       1.39       eeh  * Find the value of a DVMA address (debug routine).
    370       1.39       eeh  */
    371       1.39       eeh paddr_t
    372       1.78       cdi iommu_extract(struct iommu_state *is, vaddr_t dva)
    373       1.39       eeh {
    374       1.39       eeh 	int64_t tte = 0;
    375       1.58       chs 
    376       1.90  nakayama 	if (dva >= is->is_dvmabase && dva <= is->is_dvmaend)
    377       1.55       eeh 		tte = is->is_tsb[IOTSBSLOT(dva, is->is_tsbsize)];
    378       1.39       eeh 
    379       1.54       eeh 	if ((tte & IOTTE_V) == 0)
    380       1.39       eeh 		return ((paddr_t)-1L);
    381       1.54       eeh 	return (tte & IOTTE_PAMASK);
    382        1.2       eeh }
    383        1.2       eeh 
    384        1.2       eeh /*
    385        1.2       eeh  * iommu_remove: removes mappings created by iommu_enter
    386        1.2       eeh  *
    387        1.2       eeh  * Only demap from IOMMU if flag is set.
    388        1.8       mrg  *
    389        1.8       mrg  * XXX: this function needs better internal error checking.
    390        1.2       eeh  */
    391  1.107.2.1  jdolecek 
    392  1.107.2.1  jdolecek 
    393        1.2       eeh void
    394       1.78       cdi iommu_remove(struct iommu_state *is, vaddr_t va, size_t len)
    395        1.2       eeh {
    396  1.107.2.1  jdolecek 	DPRINTF(IDB_IOMMU, ("iommu_remove: va %lx len %zu\n", va, len));
    397  1.107.2.1  jdolecek 	if (!CPU_ISSUN4V)
    398  1.107.2.1  jdolecek 		iommu_remove_sun4u(is, va, len);
    399  1.107.2.1  jdolecek 	else
    400  1.107.2.1  jdolecek 		iommu_remove_sun4v(is, va, len);
    401  1.107.2.1  jdolecek }
    402  1.107.2.1  jdolecek 
    403  1.107.2.1  jdolecek void
    404  1.107.2.1  jdolecek iommu_remove_sun4u(struct iommu_state *is, vaddr_t va, size_t len)
    405  1.107.2.1  jdolecek {
    406  1.107.2.1  jdolecek 
    407      1.103       mrg 	int slot;
    408        1.2       eeh 
    409        1.2       eeh #ifdef DIAGNOSTIC
    410       1.45       eeh 	if (va < is->is_dvmabase || va > is->is_dvmaend)
    411       1.25       mrg 		panic("iommu_remove: va 0x%lx not in DVMA space", (u_long)va);
    412        1.2       eeh 	if ((long)(va + len) < (long)va)
    413       1.58       chs 		panic("iommu_remove: va 0x%lx + len 0x%lx wraps",
    414        1.2       eeh 		      (long) va, (long) len);
    415       1.58       chs 	if (len & ~0xfffffff)
    416       1.72       snj 		panic("iommu_remove: ridiculous len 0x%lx", (u_long)len);
    417        1.2       eeh #endif
    418        1.2       eeh 
    419        1.2       eeh 	va = trunc_page(va);
    420       1.22       mrg 	DPRINTF(IDB_IOMMU, ("iommu_remove: va %lx TSB[%lx]@%p\n",
    421       1.50       eeh 		va, (u_long)IOTSBSLOT(va, is->is_tsbsize),
    422       1.50       eeh 		&is->is_tsb[IOTSBSLOT(va, is->is_tsbsize)]));
    423        1.2       eeh 	while (len > 0) {
    424       1.50       eeh 		DPRINTF(IDB_IOMMU, ("iommu_remove: clearing TSB slot %d "
    425       1.50       eeh 			"for va %p size %lx\n",
    426       1.50       eeh 			(int)IOTSBSLOT(va,is->is_tsbsize), (void *)(u_long)va,
    427       1.50       eeh 			(u_long)len));
    428       1.64   thorpej 		if (len <= PAGE_SIZE)
    429       1.10       mrg 			len = 0;
    430       1.10       mrg 		else
    431       1.64   thorpej 			len -= PAGE_SIZE;
    432        1.8       mrg 
    433       1.99       mrg #if 0
    434       1.94  nakayama 		/*
    435       1.94  nakayama 		 * XXX Zero-ing the entry would not require RMW
    436       1.94  nakayama 		 *
    437       1.94  nakayama 		 * Disabling valid bit while a page is used by a device
    438       1.94  nakayama 		 * causes an uncorrectable DMA error.
    439       1.94  nakayama 		 * Workaround to avoid an uncorrectable DMA error is
    440       1.94  nakayama 		 * eliminating the next line, but the page is mapped
    441       1.94  nakayama 		 * until the next iommu_enter call.
    442       1.94  nakayama 		 */
    443       1.47       eeh 		is->is_tsb[IOTSBSLOT(va,is->is_tsbsize)] &= ~IOTTE_V;
    444      1.105  nakayama 		membar_StoreStore();
    445       1.99       mrg #endif
    446      1.103       mrg 		IOMMUREG_WRITE(is, iommu_flush, va);
    447      1.103       mrg 
    448      1.103       mrg 		/* Flush cache if necessary. */
    449      1.103       mrg 		slot = IOTSBSLOT(trunc_page(va), is->is_tsbsize);
    450      1.103       mrg 		if ((is->is_flags & IOMMU_FLUSH_CACHE) &&
    451      1.103       mrg 		    (len == 0 || (slot % 8) == 7))
    452      1.103       mrg 			IOMMUREG_WRITE(is, iommu_cache_flush,
    453      1.103       mrg 			    is->is_ptsb + slot * 8);
    454      1.103       mrg 
    455       1.64   thorpej 		va += PAGE_SIZE;
    456        1.2       eeh 	}
    457        1.2       eeh }
    458        1.2       eeh 
    459  1.107.2.1  jdolecek void
    460  1.107.2.1  jdolecek iommu_remove_sun4v(struct iommu_state *is, vaddr_t va, size_t len)
    461  1.107.2.1  jdolecek {
    462  1.107.2.1  jdolecek 	u_int64_t tsbid = IOTSBSLOT(va, is->is_tsbsize);
    463  1.107.2.1  jdolecek 	u_int64_t ndemapped;
    464  1.107.2.1  jdolecek 	int err;
    465  1.107.2.1  jdolecek 
    466  1.107.2.1  jdolecek #ifdef DIAGNOSTIC
    467  1.107.2.1  jdolecek 	if (va < is->is_dvmabase || (va + PAGE_MASK) > is->is_dvmaend)
    468  1.107.2.1  jdolecek 		panic("iommu_remove: va 0x%lx not in DVMA space", (u_long)va);
    469  1.107.2.1  jdolecek 	if (va != trunc_page(va)) {
    470  1.107.2.1  jdolecek 		printf("iommu_remove: unaligned va: %lx\n", va);
    471  1.107.2.1  jdolecek 		va = trunc_page(va);
    472  1.107.2.1  jdolecek 	}
    473  1.107.2.1  jdolecek #endif
    474  1.107.2.1  jdolecek 
    475  1.107.2.1  jdolecek 	err = hv_pci_iommu_demap(is->is_devhandle, tsbid, 1, &ndemapped);
    476  1.107.2.1  jdolecek 	if (err != H_EOK || ndemapped != 1)
    477  1.107.2.1  jdolecek 		panic("hv_pci_iommu_unmap: err=%d", err);
    478  1.107.2.1  jdolecek }
    479  1.107.2.1  jdolecek 
    480       1.58       chs static int
    481       1.78       cdi iommu_strbuf_flush_done(struct strbuf_ctl *sb)
    482        1.2       eeh {
    483       1.55       eeh 	struct iommu_state *is = sb->sb_is;
    484        1.2       eeh 	struct timeval cur, flushtimeout;
    485        1.2       eeh 
    486        1.2       eeh #define BUMPTIME(t, usec) { \
    487        1.2       eeh 	register volatile struct timeval *tp = (t); \
    488        1.2       eeh 	register long us; \
    489        1.2       eeh  \
    490        1.2       eeh 	tp->tv_usec = us = tp->tv_usec + (usec); \
    491        1.2       eeh 	if (us >= 1000000) { \
    492        1.2       eeh 		tp->tv_usec = us - 1000000; \
    493        1.2       eeh 		tp->tv_sec++; \
    494        1.2       eeh 	} \
    495        1.2       eeh }
    496        1.5       mrg 
    497       1.55       eeh 	if (!sb->sb_flush)
    498        1.5       mrg 		return (0);
    499       1.58       chs 
    500        1.7       mrg 	/*
    501        1.7       mrg 	 * Streaming buffer flushes:
    502       1.58       chs 	 *
    503        1.7       mrg 	 *   1 Tell strbuf to flush by storing va to strbuf_pgflush.  If
    504        1.7       mrg 	 *     we're not on a cache line boundary (64-bits):
    505        1.7       mrg 	 *   2 Store 0 in flag
    506        1.7       mrg 	 *   3 Store pointer to flag in flushsync
    507        1.7       mrg 	 *   4 wait till flushsync becomes 0x1
    508        1.7       mrg 	 *
    509        1.7       mrg 	 * If it takes more than .5 sec, something
    510        1.7       mrg 	 * went wrong.
    511        1.7       mrg 	 */
    512        1.2       eeh 
    513       1.55       eeh 	*sb->sb_flush = 0;
    514       1.58       chs 	bus_space_write_8(is->is_bustag, sb->sb_sb,
    515       1.55       eeh 		STRBUFREG(strbuf_flushsync), sb->sb_flushpa);
    516        1.2       eeh 
    517       1.58       chs 	microtime(&flushtimeout);
    518        1.2       eeh 	cur = flushtimeout;
    519        1.2       eeh 	BUMPTIME(&flushtimeout, 500000); /* 1/2 sec */
    520       1.58       chs 
    521      1.103       mrg 	DPRINTF(IDB_IOMMU, ("%s: flush = %lx at va = %lx pa = %lx now="
    522      1.103       mrg 		"%"PRIx64":%"PRIx32" until = %"PRIx64":%"PRIx32"\n", __func__,
    523       1.58       chs 		(long)*sb->sb_flush, (long)sb->sb_flush, (long)sb->sb_flushpa,
    524       1.42       eeh 		cur.tv_sec, cur.tv_usec,
    525       1.42       eeh 		flushtimeout.tv_sec, flushtimeout.tv_usec));
    526       1.42       eeh 
    527        1.2       eeh 	/* Bypass non-coherent D$ */
    528       1.55       eeh 	while ((!ldxa(sb->sb_flushpa, ASI_PHYS_CACHED)) &&
    529       1.98       mrg 	       timercmp(&cur, &flushtimeout, <=))
    530        1.2       eeh 		microtime(&cur);
    531        1.2       eeh 
    532        1.2       eeh #ifdef DIAGNOSTIC
    533       1.55       eeh 	if (!ldxa(sb->sb_flushpa, ASI_PHYS_CACHED)) {
    534      1.103       mrg 		printf("%s: flush timeout %p, at %p\n", __func__,
    535       1.55       eeh 			(void *)(u_long)*sb->sb_flush,
    536       1.55       eeh 			(void *)(u_long)sb->sb_flushpa); /* panic? */
    537        1.2       eeh #ifdef DDB
    538        1.2       eeh 		Debugger();
    539        1.2       eeh #endif
    540        1.2       eeh 	}
    541        1.2       eeh #endif
    542      1.103       mrg 	DPRINTF(IDB_IOMMU, ("%s: flushed\n", __func__));
    543       1.55       eeh 	return (*sb->sb_flush);
    544        1.7       mrg }
    545        1.7       mrg 
    546        1.7       mrg /*
    547        1.7       mrg  * IOMMU DVMA operations, common to SBUS and PCI.
    548        1.7       mrg  */
    549        1.7       mrg int
    550       1.85  nakayama iommu_dvmamap_load(bus_dma_tag_t t, bus_dmamap_t map, void *buf,
    551       1.85  nakayama 	bus_size_t buflen, struct proc *p, int flags)
    552        1.7       mrg {
    553       1.85  nakayama 	struct strbuf_ctl *sb = (struct strbuf_ctl *)map->_dm_cookie;
    554       1.55       eeh 	struct iommu_state *is = sb->sb_is;
    555       1.91  nakayama 	int err, needsflush;
    556        1.7       mrg 	bus_size_t sgsize;
    557        1.7       mrg 	paddr_t curaddr;
    558       1.90  nakayama 	u_long dvmaddr, sgstart, sgend, bmask;
    559       1.71   tsutsui 	bus_size_t align, boundary, len;
    560        1.7       mrg 	vaddr_t vaddr = (vaddr_t)buf;
    561       1.40       eeh 	int seg;
    562       1.58       chs 	struct pmap *pmap;
    563      1.103       mrg 	int slot;
    564        1.7       mrg 
    565        1.7       mrg 	if (map->dm_nsegs) {
    566        1.7       mrg 		/* Already in use?? */
    567        1.7       mrg #ifdef DIAGNOSTIC
    568        1.7       mrg 		printf("iommu_dvmamap_load: map still in use\n");
    569        1.7       mrg #endif
    570        1.7       mrg 		bus_dmamap_unload(t, map);
    571        1.7       mrg 	}
    572       1.58       chs 
    573        1.7       mrg 	/*
    574        1.7       mrg 	 * Make sure that on error condition we return "no valid mappings".
    575        1.7       mrg 	 */
    576        1.7       mrg 	map->dm_nsegs = 0;
    577       1.96  nakayama 	KASSERT(map->dm_maxsegsz <= map->_dm_maxmaxsegsz);
    578       1.96  nakayama 
    579        1.7       mrg 	if (buflen > map->_dm_size) {
    580       1.22       mrg 		DPRINTF(IDB_BUSDMA,
    581        1.7       mrg 		    ("iommu_dvmamap_load(): error %d > %d -- "
    582       1.25       mrg 		     "map size exceeded!\n", (int)buflen, (int)map->_dm_size));
    583        1.7       mrg 		return (EINVAL);
    584        1.7       mrg 	}
    585        1.7       mrg 
    586        1.7       mrg 	sgsize = round_page(buflen + ((int)vaddr & PGOFSET));
    587       1.20       mrg 
    588        1.7       mrg 	/*
    589       1.21       eeh 	 * A boundary presented to bus_dmamem_alloc() takes precedence
    590       1.21       eeh 	 * over boundary in the map.
    591        1.7       mrg 	 */
    592       1.21       eeh 	if ((boundary = (map->dm_segs[0]._ds_boundary)) == 0)
    593       1.21       eeh 		boundary = map->_dm_boundary;
    594       1.64   thorpej 	align = max(map->dm_segs[0]._ds_align, PAGE_SIZE);
    595       1.58       chs 
    596       1.58       chs 	/*
    597       1.58       chs 	 * If our segment size is larger than the boundary we need to
    598       1.40       eeh 	 * split the transfer up int little pieces ourselves.
    599       1.40       eeh 	 */
    600      1.103       mrg 	KASSERT(is->is_dvmamap);
    601      1.107       mrg 	mutex_enter(&is->is_lock);
    602       1.58       chs 	err = extent_alloc(is->is_dvmamap, sgsize, align,
    603       1.71   tsutsui 	    (sgsize > boundary) ? 0 : boundary,
    604       1.71   tsutsui 	    EX_NOWAIT|EX_BOUNDZERO, &dvmaddr);
    605      1.107       mrg 	mutex_exit(&is->is_lock);
    606        1.7       mrg 
    607        1.7       mrg #ifdef DEBUG
    608       1.71   tsutsui 	if (err || (dvmaddr == (u_long)-1)) {
    609        1.7       mrg 		printf("iommu_dvmamap_load(): extent_alloc(%d, %x) failed!\n",
    610       1.25       mrg 		    (int)sgsize, flags);
    611       1.40       eeh #ifdef DDB
    612        1.7       mrg 		Debugger();
    613       1.40       eeh #endif
    614       1.58       chs 	}
    615       1.58       chs #endif
    616       1.11       eeh 	if (err != 0)
    617       1.11       eeh 		return (err);
    618       1.11       eeh 
    619       1.65  nakayama 	if (dvmaddr == (u_long)-1)
    620        1.7       mrg 		return (ENOMEM);
    621        1.7       mrg 
    622       1.40       eeh 	/* Set the active DVMA map */
    623       1.40       eeh 	map->_dm_dvmastart = dvmaddr;
    624       1.40       eeh 	map->_dm_dvmasize = sgsize;
    625       1.40       eeh 
    626       1.40       eeh 	/*
    627       1.40       eeh 	 * Now split the DVMA range into segments, not crossing
    628       1.40       eeh 	 * the boundary.
    629       1.40       eeh 	 */
    630       1.40       eeh 	seg = 0;
    631       1.40       eeh 	sgstart = dvmaddr + (vaddr & PGOFSET);
    632       1.40       eeh 	sgend = sgstart + buflen - 1;
    633       1.40       eeh 	map->dm_segs[seg].ds_addr = sgstart;
    634       1.71   tsutsui 	DPRINTF(IDB_INFO, ("iommu_dvmamap_load: boundary %lx boundary - 1 %lx "
    635       1.71   tsutsui 	    "~(boundary - 1) %lx\n", (long)boundary, (long)(boundary - 1),
    636       1.71   tsutsui 	    (long)~(boundary - 1)));
    637       1.90  nakayama 	bmask = ~(boundary - 1);
    638       1.96  nakayama 	while ((sgstart & bmask) != (sgend & bmask) ||
    639       1.96  nakayama 	       sgend - sgstart + 1 > map->dm_maxsegsz) {
    640       1.96  nakayama 		/* Oops. We crossed a boundary or large seg. Split the xfer. */
    641       1.96  nakayama 		len = map->dm_maxsegsz;
    642       1.96  nakayama 		if ((sgstart & bmask) != (sgend & bmask))
    643       1.96  nakayama 			len = min(len, boundary - (sgstart & (boundary - 1)));
    644       1.71   tsutsui 		map->dm_segs[seg].ds_len = len;
    645       1.40       eeh 		DPRINTF(IDB_INFO, ("iommu_dvmamap_load: "
    646       1.71   tsutsui 		    "seg %d start %lx size %lx\n", seg,
    647       1.71   tsutsui 		    (long)map->dm_segs[seg].ds_addr,
    648       1.71   tsutsui 		    (long)map->dm_segs[seg].ds_len));
    649       1.53       eeh 		if (++seg >= map->_dm_segcnt) {
    650       1.40       eeh 			/* Too many segments.  Fail the operation. */
    651       1.40       eeh 			DPRINTF(IDB_INFO, ("iommu_dvmamap_load: "
    652       1.71   tsutsui 			    "too many segments %d\n", seg));
    653      1.107       mrg 			mutex_enter(&is->is_lock);
    654       1.40       eeh 			err = extent_free(is->is_dvmamap,
    655       1.71   tsutsui 			    dvmaddr, sgsize, EX_NOWAIT);
    656       1.40       eeh 			map->_dm_dvmastart = 0;
    657       1.40       eeh 			map->_dm_dvmasize = 0;
    658      1.107       mrg 			mutex_exit(&is->is_lock);
    659       1.95  nakayama 			if (err != 0)
    660       1.95  nakayama 				printf("warning: %s: %" PRId64
    661       1.95  nakayama 				    " of DVMA space lost\n", __func__, sgsize);
    662       1.80       mrg 			return (EFBIG);
    663       1.40       eeh 		}
    664       1.71   tsutsui 		sgstart += len;
    665       1.40       eeh 		map->dm_segs[seg].ds_addr = sgstart;
    666       1.40       eeh 	}
    667       1.40       eeh 	map->dm_segs[seg].ds_len = sgend - sgstart + 1;
    668       1.40       eeh 	DPRINTF(IDB_INFO, ("iommu_dvmamap_load: "
    669       1.71   tsutsui 	    "seg %d start %lx size %lx\n", seg,
    670       1.71   tsutsui 	    (long)map->dm_segs[seg].ds_addr, (long)map->dm_segs[seg].ds_len));
    671       1.71   tsutsui 	map->dm_nsegs = seg + 1;
    672        1.7       mrg 	map->dm_mapsize = buflen;
    673        1.7       mrg 
    674        1.7       mrg 	if (p != NULL)
    675        1.7       mrg 		pmap = p->p_vmspace->vm_map.pmap;
    676        1.7       mrg 	else
    677        1.7       mrg 		pmap = pmap_kernel();
    678        1.7       mrg 
    679       1.91  nakayama 	needsflush = 0;
    680        1.7       mrg 	for (; buflen > 0; ) {
    681       1.58       chs 
    682        1.7       mrg 		/*
    683        1.7       mrg 		 * Get the physical address for this page.
    684        1.7       mrg 		 */
    685        1.7       mrg 		if (pmap_extract(pmap, (vaddr_t)vaddr, &curaddr) == FALSE) {
    686       1.74    petrov #ifdef DIAGNOSTIC
    687       1.74    petrov 			printf("iommu_dvmamap_load: pmap_extract failed %lx\n", vaddr);
    688       1.74    petrov #endif
    689        1.7       mrg 			bus_dmamap_unload(t, map);
    690        1.7       mrg 			return (-1);
    691        1.7       mrg 		}
    692        1.7       mrg 
    693        1.7       mrg 		/*
    694        1.7       mrg 		 * Compute the segment size, and adjust counts.
    695        1.7       mrg 		 */
    696       1.64   thorpej 		sgsize = PAGE_SIZE - ((u_long)vaddr & PGOFSET);
    697        1.7       mrg 		if (buflen < sgsize)
    698        1.7       mrg 			sgsize = buflen;
    699        1.7       mrg 
    700       1.22       mrg 		DPRINTF(IDB_BUSDMA,
    701       1.36       eeh 		    ("iommu_dvmamap_load: map %p loading va %p "
    702       1.71   tsutsui 		    "dva %lx at pa %lx\n",
    703       1.71   tsutsui 		    map, (void *)vaddr, (long)dvmaddr,
    704       1.87  nakayama 		    (long)trunc_page(curaddr)));
    705       1.55       eeh 		iommu_enter(sb, trunc_page(dvmaddr), trunc_page(curaddr),
    706       1.90  nakayama 		    flags | IOTTE_DEBUG(0x4000));
    707       1.91  nakayama 		needsflush = 1;
    708       1.58       chs 
    709        1.7       mrg 		vaddr += sgsize;
    710        1.7       mrg 		buflen -= sgsize;
    711      1.103       mrg 
    712      1.103       mrg 		/* Flush cache if necessary. */
    713      1.103       mrg 		slot = IOTSBSLOT(trunc_page(dvmaddr), is->is_tsbsize);
    714      1.103       mrg 		if ((is->is_flags & IOMMU_FLUSH_CACHE) &&
    715      1.103       mrg 		    (buflen <= 0 || (slot % 8) == 7))
    716      1.103       mrg 			IOMMUREG_WRITE(is, iommu_cache_flush,
    717      1.103       mrg 			    is->is_ptsb + slot * 8);
    718      1.103       mrg 
    719      1.103       mrg 		dvmaddr += PAGE_SIZE;
    720        1.7       mrg 	}
    721       1.91  nakayama 	if (needsflush)
    722       1.91  nakayama 		iommu_strbuf_flush_done(sb);
    723       1.45       eeh #ifdef DIAGNOSTIC
    724       1.45       eeh 	for (seg = 0; seg < map->dm_nsegs; seg++) {
    725       1.45       eeh 		if (map->dm_segs[seg].ds_addr < is->is_dvmabase ||
    726       1.45       eeh 			map->dm_segs[seg].ds_addr > is->is_dvmaend) {
    727       1.45       eeh 			printf("seg %d dvmaddr %lx out of range %x - %x\n",
    728       1.71   tsutsui 			    seg, (long)map->dm_segs[seg].ds_addr,
    729       1.71   tsutsui 			    is->is_dvmabase, is->is_dvmaend);
    730       1.57       chs #ifdef DDB
    731       1.45       eeh 			Debugger();
    732       1.57       chs #endif
    733       1.45       eeh 		}
    734       1.45       eeh 	}
    735       1.45       eeh #endif
    736        1.7       mrg 	return (0);
    737        1.7       mrg }
    738        1.7       mrg 
    739        1.7       mrg 
    740        1.7       mrg void
    741       1.85  nakayama iommu_dvmamap_unload(bus_dma_tag_t t, bus_dmamap_t map)
    742        1.7       mrg {
    743       1.85  nakayama 	struct strbuf_ctl *sb = (struct strbuf_ctl *)map->_dm_cookie;
    744       1.55       eeh 	struct iommu_state *is = sb->sb_is;
    745      1.107       mrg 	int error;
    746       1.70  christos 	bus_size_t sgsize = map->_dm_dvmasize;
    747        1.7       mrg 
    748       1.40       eeh 	/* Flush the iommu */
    749  1.107.2.1  jdolecek 	if (!map->_dm_dvmastart)
    750  1.107.2.1  jdolecek 		panic("%s: error dvmastart is zero!\n", __func__);
    751       1.40       eeh 	iommu_remove(is, map->_dm_dvmastart, map->_dm_dvmasize);
    752        1.7       mrg 
    753       1.23       eeh 	/* Flush the caches */
    754       1.23       eeh 	bus_dmamap_unload(t->_parent, map);
    755       1.23       eeh 
    756      1.107       mrg 	mutex_enter(&is->is_lock);
    757       1.58       chs 	error = extent_free(is->is_dvmamap, map->_dm_dvmastart,
    758       1.40       eeh 		map->_dm_dvmasize, EX_NOWAIT);
    759       1.43       eeh 	map->_dm_dvmastart = 0;
    760       1.43       eeh 	map->_dm_dvmasize = 0;
    761      1.107       mrg 	mutex_exit(&is->is_lock);
    762        1.7       mrg 	if (error != 0)
    763       1.95  nakayama 		printf("warning: %s: %" PRId64 " of DVMA space lost\n",
    764       1.95  nakayama 		    __func__, sgsize);
    765       1.40       eeh 
    766       1.40       eeh 	/* Clear the map */
    767        1.9       eeh }
    768        1.9       eeh 
    769        1.9       eeh 
    770        1.9       eeh int
    771       1.85  nakayama iommu_dvmamap_load_raw(bus_dma_tag_t t, bus_dmamap_t map,
    772       1.85  nakayama 	bus_dma_segment_t *segs, int nsegs, bus_size_t size, int flags)
    773        1.9       eeh {
    774       1.85  nakayama 	struct strbuf_ctl *sb = (struct strbuf_ctl *)map->_dm_cookie;
    775       1.55       eeh 	struct iommu_state *is = sb->sb_is;
    776       1.58       chs 	struct vm_page *pg;
    777      1.107       mrg 	int i, j;
    778       1.26    martin 	int left;
    779       1.91  nakayama 	int err, needsflush;
    780        1.9       eeh 	bus_size_t sgsize;
    781        1.9       eeh 	paddr_t pa;
    782       1.21       eeh 	bus_size_t boundary, align;
    783       1.90  nakayama 	u_long dvmaddr, sgstart, sgend, bmask;
    784       1.58       chs 	struct pglist *pglist;
    785       1.90  nakayama 	const int pagesz = PAGE_SIZE;
    786      1.103       mrg 	int slot;
    787       1.90  nakayama #ifdef DEBUG
    788       1.90  nakayama 	int npg = 0;
    789       1.90  nakayama #endif
    790        1.9       eeh 
    791        1.9       eeh 	if (map->dm_nsegs) {
    792        1.9       eeh 		/* Already in use?? */
    793        1.9       eeh #ifdef DIAGNOSTIC
    794        1.9       eeh 		printf("iommu_dvmamap_load_raw: map still in use\n");
    795        1.9       eeh #endif
    796        1.9       eeh 		bus_dmamap_unload(t, map);
    797        1.9       eeh 	}
    798       1.40       eeh 
    799       1.40       eeh 	/*
    800       1.40       eeh 	 * A boundary presented to bus_dmamem_alloc() takes precedence
    801       1.40       eeh 	 * over boundary in the map.
    802       1.40       eeh 	 */
    803       1.40       eeh 	if ((boundary = segs[0]._ds_boundary) == 0)
    804       1.40       eeh 		boundary = map->_dm_boundary;
    805       1.40       eeh 
    806       1.45       eeh 	align = max(segs[0]._ds_align, pagesz);
    807       1.40       eeh 
    808        1.9       eeh 	/*
    809        1.9       eeh 	 * Make sure that on error condition we return "no valid mappings".
    810        1.9       eeh 	 */
    811        1.9       eeh 	map->dm_nsegs = 0;
    812       1.26    martin 	/* Count up the total number of pages we need */
    813       1.93  nakayama 	pa = trunc_page(segs[0].ds_addr);
    814       1.26    martin 	sgsize = 0;
    815       1.40       eeh 	left = size;
    816       1.93  nakayama 	for (i = 0; left > 0 && i < nsegs; i++) {
    817       1.26    martin 		if (round_page(pa) != round_page(segs[i].ds_addr))
    818       1.93  nakayama 			sgsize = round_page(sgsize) +
    819       1.93  nakayama 			    (segs[i].ds_addr & PGOFSET);
    820       1.40       eeh 		sgsize += min(left, segs[i].ds_len);
    821       1.40       eeh 		left -= segs[i].ds_len;
    822       1.26    martin 		pa = segs[i].ds_addr + segs[i].ds_len;
    823       1.26    martin 	}
    824       1.93  nakayama 	sgsize = round_page(sgsize);
    825        1.9       eeh 
    826      1.107       mrg 	mutex_enter(&is->is_lock);
    827       1.58       chs 	/*
    828       1.58       chs 	 * If our segment size is larger than the boundary we need to
    829       1.45       eeh 	 * split the transfer up into little pieces ourselves.
    830        1.9       eeh 	 */
    831       1.40       eeh 	err = extent_alloc(is->is_dvmamap, sgsize, align,
    832       1.40       eeh 		(sgsize > boundary) ? 0 : boundary,
    833       1.40       eeh 		((flags & BUS_DMA_NOWAIT) == 0 ? EX_WAITOK : EX_NOWAIT) |
    834       1.54       eeh 		EX_BOUNDZERO, &dvmaddr);
    835      1.107       mrg 	mutex_exit(&is->is_lock);
    836        1.9       eeh 
    837        1.9       eeh 	if (err != 0)
    838        1.9       eeh 		return (err);
    839        1.9       eeh 
    840        1.9       eeh #ifdef DEBUG
    841       1.65  nakayama 	if (dvmaddr == (u_long)-1)
    842       1.58       chs 	{
    843        1.9       eeh 		printf("iommu_dvmamap_load_raw(): extent_alloc(%d, %x) failed!\n",
    844       1.25       mrg 		    (int)sgsize, flags);
    845       1.57       chs #ifdef DDB
    846        1.9       eeh 		Debugger();
    847       1.57       chs #endif
    848       1.58       chs 	}
    849       1.58       chs #endif
    850       1.65  nakayama 	if (dvmaddr == (u_long)-1)
    851        1.9       eeh 		return (ENOMEM);
    852        1.9       eeh 
    853       1.40       eeh 	/* Set the active DVMA map */
    854       1.40       eeh 	map->_dm_dvmastart = dvmaddr;
    855       1.40       eeh 	map->_dm_dvmasize = sgsize;
    856       1.40       eeh 
    857       1.90  nakayama 	bmask = ~(boundary - 1);
    858       1.58       chs 	if ((pglist = segs[0]._ds_mlist) == NULL) {
    859       1.92  nakayama 		u_long prev_va = 0UL, last_va = dvmaddr;
    860       1.45       eeh 		paddr_t prev_pa = 0;
    861       1.45       eeh 		int end = 0, offset;
    862       1.92  nakayama 		bus_size_t len = size;
    863       1.45       eeh 
    864       1.26    martin 		/*
    865       1.45       eeh 		 * This segs is made up of individual physical
    866       1.58       chs 		 *  segments, probably by _bus_dmamap_load_uio() or
    867       1.26    martin 		 * _bus_dmamap_load_mbuf().  Ignore the mlist and
    868       1.45       eeh 		 * load each one individually.
    869       1.26    martin 		 */
    870       1.45       eeh 		j = 0;
    871       1.91  nakayama 		needsflush = 0;
    872       1.45       eeh 		for (i = 0; i < nsegs ; i++) {
    873       1.40       eeh 
    874       1.45       eeh 			pa = segs[i].ds_addr;
    875       1.45       eeh 			offset = (pa & PGOFSET);
    876       1.45       eeh 			pa = trunc_page(pa);
    877       1.45       eeh 			dvmaddr = trunc_page(dvmaddr);
    878       1.92  nakayama 			left = min(len, segs[i].ds_len);
    879       1.45       eeh 
    880       1.45       eeh 			DPRINTF(IDB_INFO, ("iommu_dvmamap_load_raw: converting "
    881       1.58       chs 				"physseg %d start %lx size %lx\n", i,
    882       1.61    martin 				(long)segs[i].ds_addr, (long)segs[i].ds_len));
    883       1.26    martin 
    884       1.58       chs 			if ((pa == prev_pa) &&
    885       1.47       eeh 				((offset != 0) || (end != offset))) {
    886       1.45       eeh 				/* We can re-use this mapping */
    887       1.45       eeh 				dvmaddr = prev_va;
    888       1.45       eeh 			}
    889       1.29    martin 
    890       1.45       eeh 			sgstart = dvmaddr + offset;
    891       1.45       eeh 			sgend = sgstart + left - 1;
    892       1.26    martin 
    893       1.45       eeh 			/* Are the segments virtually adjacent? */
    894       1.58       chs 			if ((j > 0) && (end == offset) &&
    895       1.96  nakayama 			    ((offset == 0) || (pa == prev_pa)) &&
    896       1.96  nakayama 			    (map->dm_segs[j-1].ds_len + left <=
    897       1.96  nakayama 			     map->dm_maxsegsz)) {
    898       1.45       eeh 				/* Just append to the previous segment. */
    899       1.45       eeh 				map->dm_segs[--j].ds_len += left;
    900       1.93  nakayama 				/* Restore sgstart for boundary check */
    901       1.93  nakayama 				sgstart = map->dm_segs[j].ds_addr;
    902       1.45       eeh 				DPRINTF(IDB_INFO, ("iommu_dvmamap_load_raw: "
    903       1.45       eeh 					"appending seg %d start %lx size %lx\n", j,
    904       1.58       chs 					(long)map->dm_segs[j].ds_addr,
    905       1.61    martin 					(long)map->dm_segs[j].ds_len));
    906       1.45       eeh 			} else {
    907       1.53       eeh 				if (j >= map->_dm_segcnt) {
    908       1.92  nakayama 					iommu_remove(is, map->_dm_dvmastart,
    909       1.92  nakayama 					    last_va - map->_dm_dvmastart);
    910       1.92  nakayama 					goto fail;
    911       1.53       eeh 				}
    912       1.45       eeh 				map->dm_segs[j].ds_addr = sgstart;
    913       1.45       eeh 				map->dm_segs[j].ds_len = left;
    914       1.45       eeh 				DPRINTF(IDB_INFO, ("iommu_dvmamap_load_raw: "
    915       1.45       eeh 					"seg %d start %lx size %lx\n", j,
    916       1.48       eeh 					(long)map->dm_segs[j].ds_addr,
    917       1.61    martin 					(long)map->dm_segs[j].ds_len));
    918       1.40       eeh 			}
    919       1.45       eeh 			end = (offset + left) & PGOFSET;
    920       1.40       eeh 
    921       1.40       eeh 			/* Check for boundary issues */
    922       1.90  nakayama 			while ((sgstart & bmask) != (sgend & bmask)) {
    923       1.40       eeh 				/* Need a new segment. */
    924       1.40       eeh 				map->dm_segs[j].ds_len =
    925       1.53       eeh 					boundary - (sgstart & (boundary - 1));
    926       1.40       eeh 				DPRINTF(IDB_INFO, ("iommu_dvmamap_load_raw: "
    927       1.40       eeh 					"seg %d start %lx size %lx\n", j,
    928       1.58       chs 					(long)map->dm_segs[j].ds_addr,
    929       1.61    martin 					(long)map->dm_segs[j].ds_len));
    930       1.53       eeh 				if (++j >= map->_dm_segcnt) {
    931       1.92  nakayama 					iommu_remove(is, map->_dm_dvmastart,
    932       1.92  nakayama 					    last_va - map->_dm_dvmastart);
    933       1.92  nakayama 					goto fail;
    934       1.40       eeh 				}
    935       1.93  nakayama 				sgstart += map->dm_segs[j-1].ds_len;
    936       1.40       eeh 				map->dm_segs[j].ds_addr = sgstart;
    937       1.40       eeh 				map->dm_segs[j].ds_len = sgend - sgstart + 1;
    938       1.40       eeh 			}
    939       1.40       eeh 
    940       1.26    martin 			if (sgsize == 0)
    941       1.26    martin 				panic("iommu_dmamap_load_raw: size botch");
    942       1.40       eeh 
    943       1.45       eeh 			/* Now map a series of pages. */
    944       1.51       eeh 			while (dvmaddr <= sgend) {
    945       1.45       eeh 				DPRINTF(IDB_BUSDMA,
    946       1.45       eeh 					("iommu_dvmamap_load_raw: map %p "
    947       1.45       eeh 						"loading va %lx at pa %lx\n",
    948       1.45       eeh 						map, (long)dvmaddr,
    949       1.45       eeh 						(long)(pa)));
    950       1.45       eeh 				/* Enter it if we haven't before. */
    951       1.91  nakayama 				if (prev_va != dvmaddr) {
    952       1.55       eeh 					iommu_enter(sb, prev_va = dvmaddr,
    953       1.90  nakayama 					    prev_pa = pa,
    954       1.90  nakayama 					    flags | IOTTE_DEBUG(++npg << 12));
    955       1.91  nakayama 					needsflush = 1;
    956      1.103       mrg 
    957      1.103       mrg 					/* Flush cache if necessary. */
    958      1.103       mrg 					slot = IOTSBSLOT(trunc_page(dvmaddr), is->is_tsbsize);
    959      1.103       mrg 					if ((is->is_flags & IOMMU_FLUSH_CACHE) &&
    960      1.103       mrg 					    ((dvmaddr + pagesz) > sgend || (slot % 8) == 7))
    961      1.103       mrg 						IOMMUREG_WRITE(is, iommu_cache_flush,
    962      1.103       mrg 						    is->is_ptsb + slot * 8);
    963       1.91  nakayama 				}
    964      1.103       mrg 
    965       1.45       eeh 				dvmaddr += pagesz;
    966       1.45       eeh 				pa += pagesz;
    967       1.92  nakayama 				last_va = dvmaddr;
    968       1.45       eeh 			}
    969       1.45       eeh 
    970       1.92  nakayama 			len -= left;
    971       1.45       eeh 			++j;
    972       1.26    martin 		}
    973       1.91  nakayama 		if (needsflush)
    974       1.91  nakayama 			iommu_strbuf_flush_done(sb);
    975       1.45       eeh 
    976       1.92  nakayama 		map->dm_mapsize = size;
    977       1.45       eeh 		map->dm_nsegs = j;
    978       1.45       eeh #ifdef DIAGNOSTIC
    979       1.45       eeh 		{ int seg;
    980       1.45       eeh 	for (seg = 0; seg < map->dm_nsegs; seg++) {
    981       1.45       eeh 		if (map->dm_segs[seg].ds_addr < is->is_dvmabase ||
    982      1.103       mrg 		    map->dm_segs[seg].ds_addr > is->is_dvmaend) {
    983       1.45       eeh 			printf("seg %d dvmaddr %lx out of range %x - %x\n",
    984       1.58       chs 				seg, (long)map->dm_segs[seg].ds_addr,
    985       1.45       eeh 				is->is_dvmabase, is->is_dvmaend);
    986       1.57       chs #ifdef DDB
    987       1.45       eeh 			Debugger();
    988       1.57       chs #endif
    989       1.45       eeh 		}
    990       1.45       eeh 	}
    991       1.45       eeh 		}
    992       1.45       eeh #endif
    993       1.26    martin 		return (0);
    994       1.26    martin 	}
    995       1.58       chs 
    996        1.9       eeh 	/*
    997       1.40       eeh 	 * This was allocated with bus_dmamem_alloc.
    998       1.58       chs 	 * The pages are on a `pglist'.
    999        1.9       eeh 	 */
   1000       1.26    martin 	i = 0;
   1001       1.40       eeh 	sgstart = dvmaddr;
   1002       1.40       eeh 	sgend = sgstart + size - 1;
   1003       1.40       eeh 	map->dm_segs[i].ds_addr = sgstart;
   1004       1.90  nakayama 	while ((sgstart & bmask) != (sgend & bmask)) {
   1005       1.40       eeh 		/* Oops.  We crossed a boundary.  Split the xfer. */
   1006       1.53       eeh 		map->dm_segs[i].ds_len = boundary - (sgstart & (boundary - 1));
   1007       1.40       eeh 		DPRINTF(IDB_INFO, ("iommu_dvmamap_load_raw: "
   1008       1.40       eeh 			"seg %d start %lx size %lx\n", i,
   1009       1.48       eeh 			(long)map->dm_segs[i].ds_addr,
   1010       1.61    martin 			(long)map->dm_segs[i].ds_len));
   1011       1.53       eeh 		if (++i >= map->_dm_segcnt) {
   1012       1.40       eeh 			/* Too many segments.  Fail the operation. */
   1013       1.92  nakayama 			goto fail;
   1014       1.40       eeh 		}
   1015       1.93  nakayama 		sgstart += map->dm_segs[i-1].ds_len;
   1016       1.40       eeh 		map->dm_segs[i].ds_addr = sgstart;
   1017       1.40       eeh 	}
   1018       1.40       eeh 	DPRINTF(IDB_INFO, ("iommu_dvmamap_load_raw: "
   1019       1.40       eeh 			"seg %d start %lx size %lx\n", i,
   1020       1.61    martin 			(long)map->dm_segs[i].ds_addr, (long)map->dm_segs[i].ds_len));
   1021       1.40       eeh 	map->dm_segs[i].ds_len = sgend - sgstart + 1;
   1022        1.9       eeh 
   1023       1.91  nakayama 	needsflush = 0;
   1024       1.83        ad 	TAILQ_FOREACH(pg, pglist, pageq.queue) {
   1025        1.9       eeh 		if (sgsize == 0)
   1026        1.9       eeh 			panic("iommu_dmamap_load_raw: size botch");
   1027       1.58       chs 		pa = VM_PAGE_TO_PHYS(pg);
   1028        1.9       eeh 
   1029       1.22       mrg 		DPRINTF(IDB_BUSDMA,
   1030        1.9       eeh 		    ("iommu_dvmamap_load_raw: map %p loading va %lx at pa %lx\n",
   1031        1.9       eeh 		    map, (long)dvmaddr, (long)(pa)));
   1032       1.90  nakayama 		iommu_enter(sb, dvmaddr, pa, flags | IOTTE_DEBUG(0x8000));
   1033       1.91  nakayama 		needsflush = 1;
   1034       1.58       chs 
   1035      1.103       mrg 		sgsize -= pagesz;
   1036      1.103       mrg 
   1037      1.103       mrg 		/* Flush cache if necessary. */
   1038      1.103       mrg 		slot = IOTSBSLOT(trunc_page(dvmaddr), is->is_tsbsize);
   1039      1.103       mrg 		if ((is->is_flags & IOMMU_FLUSH_CACHE) &&
   1040      1.103       mrg 		    (sgsize == 0 || (slot % 8) == 7))
   1041      1.103       mrg 			IOMMUREG_WRITE(is, iommu_cache_flush,
   1042      1.103       mrg 			    is->is_ptsb + slot * 8);
   1043      1.103       mrg 
   1044      1.102       mrg 		dvmaddr += pagesz;
   1045        1.9       eeh 	}
   1046       1.91  nakayama 	if (needsflush)
   1047       1.91  nakayama 		iommu_strbuf_flush_done(sb);
   1048       1.40       eeh 	map->dm_mapsize = size;
   1049       1.40       eeh 	map->dm_nsegs = i+1;
   1050       1.45       eeh #ifdef DIAGNOSTIC
   1051       1.45       eeh 	{ int seg;
   1052       1.45       eeh 	for (seg = 0; seg < map->dm_nsegs; seg++) {
   1053       1.45       eeh 		if (map->dm_segs[seg].ds_addr < is->is_dvmabase ||
   1054       1.45       eeh 			map->dm_segs[seg].ds_addr > is->is_dvmaend) {
   1055       1.45       eeh 			printf("seg %d dvmaddr %lx out of range %x - %x\n",
   1056       1.58       chs 				seg, (long)map->dm_segs[seg].ds_addr,
   1057       1.45       eeh 				is->is_dvmabase, is->is_dvmaend);
   1058       1.57       chs #ifdef DDB
   1059       1.45       eeh 			Debugger();
   1060       1.57       chs #endif
   1061       1.45       eeh 		}
   1062       1.45       eeh 	}
   1063       1.45       eeh 	}
   1064       1.45       eeh #endif
   1065        1.9       eeh 	return (0);
   1066       1.92  nakayama 
   1067       1.92  nakayama fail:
   1068      1.107       mrg 	mutex_enter(&is->is_lock);
   1069       1.92  nakayama 	err = extent_free(is->is_dvmamap, map->_dm_dvmastart, sgsize,
   1070       1.92  nakayama 	    EX_NOWAIT);
   1071       1.92  nakayama 	map->_dm_dvmastart = 0;
   1072       1.92  nakayama 	map->_dm_dvmasize = 0;
   1073      1.107       mrg 	mutex_exit(&is->is_lock);
   1074       1.95  nakayama 	if (err != 0)
   1075       1.95  nakayama 		printf("warning: %s: %" PRId64 " of DVMA space lost\n",
   1076       1.95  nakayama 		    __func__, sgsize);
   1077       1.92  nakayama 	return (EFBIG);
   1078        1.7       mrg }
   1079        1.7       mrg 
   1080       1.67    petrov 
   1081       1.67    petrov /*
   1082       1.67    petrov  * Flush an individual dma segment, returns non-zero if the streaming buffers
   1083       1.67    petrov  * need flushing afterwards.
   1084       1.67    petrov  */
   1085       1.67    petrov static int
   1086       1.67    petrov iommu_dvmamap_sync_range(struct strbuf_ctl *sb, vaddr_t va, bus_size_t len)
   1087       1.67    petrov {
   1088       1.67    petrov 	vaddr_t vaend;
   1089       1.67    petrov 	struct iommu_state *is = sb->sb_is;
   1090       1.67    petrov 
   1091       1.67    petrov #ifdef DIAGNOSTIC
   1092       1.67    petrov 	if (va < is->is_dvmabase || va > is->is_dvmaend)
   1093       1.67    petrov 		panic("invalid va: %llx", (long long)va);
   1094       1.67    petrov #endif
   1095       1.67    petrov 
   1096       1.67    petrov 	if ((is->is_tsb[IOTSBSLOT(va, is->is_tsbsize)] & IOTTE_STREAM) == 0) {
   1097      1.103       mrg 		DPRINTF(IDB_SYNC,
   1098       1.67    petrov 			("iommu_dvmamap_sync_range: attempting to flush "
   1099       1.67    petrov 			 "non-streaming entry\n"));
   1100       1.67    petrov 		return (0);
   1101       1.67    petrov 	}
   1102       1.67    petrov 
   1103       1.90  nakayama 	vaend = round_page(va + len) - 1;
   1104       1.87  nakayama 	va = trunc_page(va);
   1105       1.67    petrov 
   1106       1.67    petrov #ifdef DIAGNOSTIC
   1107       1.67    petrov 	if (va < is->is_dvmabase || vaend > is->is_dvmaend)
   1108       1.67    petrov 		panic("invalid va range: %llx to %llx (%x to %x)",
   1109       1.67    petrov 		    (long long)va, (long long)vaend,
   1110       1.67    petrov 		    is->is_dvmabase,
   1111       1.67    petrov 		    is->is_dvmaend);
   1112       1.67    petrov #endif
   1113       1.67    petrov 
   1114       1.67    petrov 	for ( ; va <= vaend; va += PAGE_SIZE) {
   1115      1.103       mrg 		DPRINTF(IDB_SYNC,
   1116       1.67    petrov 		    ("iommu_dvmamap_sync_range: flushing va %p\n",
   1117       1.67    petrov 		    (void *)(u_long)va));
   1118       1.67    petrov 		iommu_strbuf_flush(sb, va);
   1119       1.67    petrov 	}
   1120       1.67    petrov 
   1121       1.67    petrov 	return (1);
   1122       1.67    petrov }
   1123       1.67    petrov 
   1124       1.85  nakayama static void
   1125       1.85  nakayama _iommu_dvmamap_sync(bus_dma_tag_t t, bus_dmamap_t map, bus_addr_t offset,
   1126       1.85  nakayama 	bus_size_t len, int ops)
   1127        1.7       mrg {
   1128       1.85  nakayama 	struct strbuf_ctl *sb = (struct strbuf_ctl *)map->_dm_cookie;
   1129       1.67    petrov 	bus_size_t count;
   1130       1.67    petrov 	int i, needsflush = 0;
   1131       1.63    petrov 
   1132       1.63    petrov 	if (!sb->sb_flush)
   1133       1.63    petrov 		return;
   1134        1.7       mrg 
   1135       1.67    petrov 	for (i = 0; i < map->dm_nsegs; i++) {
   1136       1.67    petrov 		if (offset < map->dm_segs[i].ds_len)
   1137       1.67    petrov 			break;
   1138       1.67    petrov 		offset -= map->dm_segs[i].ds_len;
   1139       1.67    petrov 	}
   1140       1.60    petrov 
   1141       1.67    petrov 	if (i == map->dm_nsegs)
   1142      1.103       mrg 		panic("%s: segment too short %llu", __func__,
   1143       1.68    martin 		    (unsigned long long)offset);
   1144       1.60    petrov 
   1145       1.62    petrov 	if (ops & (BUS_DMASYNC_PREREAD | BUS_DMASYNC_POSTWRITE)) {
   1146       1.60    petrov 		/* Nothing to do */;
   1147       1.60    petrov 	}
   1148       1.60    petrov 
   1149       1.62    petrov 	if (ops & (BUS_DMASYNC_POSTREAD | BUS_DMASYNC_PREWRITE)) {
   1150       1.67    petrov 
   1151       1.67    petrov 		for (; len > 0 && i < map->dm_nsegs; i++) {
   1152       1.67    petrov 			count = MIN(map->dm_segs[i].ds_len - offset, len);
   1153       1.67    petrov 			if (count > 0 &&
   1154       1.67    petrov 			    iommu_dvmamap_sync_range(sb,
   1155       1.67    petrov 				map->dm_segs[i].ds_addr + offset, count))
   1156       1.67    petrov 				needsflush = 1;
   1157       1.67    petrov 			offset = 0;
   1158       1.67    petrov 			len -= count;
   1159       1.67    petrov 		}
   1160       1.60    petrov #ifdef DIAGNOSTIC
   1161       1.67    petrov 		if (i == map->dm_nsegs && len > 0)
   1162      1.103       mrg 			panic("%s: leftover %llu", __func__,
   1163       1.73  nakayama 			    (unsigned long long)len);
   1164       1.60    petrov #endif
   1165       1.55       eeh 
   1166       1.67    petrov 		if (needsflush)
   1167       1.58       chs 			iommu_strbuf_flush_done(sb);
   1168        1.7       mrg 	}
   1169        1.7       mrg }
   1170        1.7       mrg 
   1171       1.85  nakayama void
   1172       1.85  nakayama iommu_dvmamap_sync(bus_dma_tag_t t, bus_dmamap_t map, bus_addr_t offset,
   1173       1.85  nakayama 	bus_size_t len, int ops)
   1174       1.85  nakayama {
   1175       1.85  nakayama 
   1176       1.89       jdc 	/* If len is 0, then there is nothing to do */
   1177       1.89       jdc 	if (len == 0)
   1178       1.89       jdc 		return;
   1179       1.89       jdc 
   1180       1.85  nakayama 	if (ops & (BUS_DMASYNC_PREREAD | BUS_DMASYNC_PREWRITE)) {
   1181       1.85  nakayama 		/* Flush the CPU then the IOMMU */
   1182       1.85  nakayama 		bus_dmamap_sync(t->_parent, map, offset, len, ops);
   1183       1.85  nakayama 		_iommu_dvmamap_sync(t, map, offset, len, ops);
   1184       1.85  nakayama 	}
   1185       1.85  nakayama 	if (ops & (BUS_DMASYNC_POSTREAD | BUS_DMASYNC_POSTWRITE)) {
   1186       1.85  nakayama 		/* Flush the IOMMU then the CPU */
   1187       1.85  nakayama 		_iommu_dvmamap_sync(t, map, offset, len, ops);
   1188       1.85  nakayama 		bus_dmamap_sync(t->_parent, map, offset, len, ops);
   1189       1.85  nakayama 	}
   1190       1.85  nakayama }
   1191       1.85  nakayama 
   1192        1.7       mrg int
   1193       1.85  nakayama iommu_dvmamem_alloc(bus_dma_tag_t t, bus_size_t size, bus_size_t alignment,
   1194       1.85  nakayama 	bus_size_t boundary, bus_dma_segment_t *segs, int nsegs, int *rsegs,
   1195       1.85  nakayama 	int flags)
   1196        1.7       mrg {
   1197        1.7       mrg 
   1198       1.25       mrg 	DPRINTF(IDB_BUSDMA, ("iommu_dvmamem_alloc: sz %llx align %llx bound %llx "
   1199       1.25       mrg 	   "segp %p flags %d\n", (unsigned long long)size,
   1200       1.25       mrg 	   (unsigned long long)alignment, (unsigned long long)boundary,
   1201       1.25       mrg 	   segs, flags));
   1202        1.7       mrg 	return (bus_dmamem_alloc(t->_parent, size, alignment, boundary,
   1203       1.21       eeh 	    segs, nsegs, rsegs, flags|BUS_DMA_DVMA));
   1204        1.7       mrg }
   1205        1.7       mrg 
   1206        1.7       mrg void
   1207       1.85  nakayama iommu_dvmamem_free(bus_dma_tag_t t, bus_dma_segment_t *segs, int nsegs)
   1208        1.7       mrg {
   1209        1.7       mrg 
   1210       1.22       mrg 	DPRINTF(IDB_BUSDMA, ("iommu_dvmamem_free: segp %p nsegs %d\n",
   1211        1.7       mrg 	    segs, nsegs));
   1212        1.7       mrg 	bus_dmamem_free(t->_parent, segs, nsegs);
   1213        1.7       mrg }
   1214        1.7       mrg 
   1215        1.7       mrg /*
   1216        1.7       mrg  * Map the DVMA mappings into the kernel pmap.
   1217        1.7       mrg  * Check the flags to see whether we're streaming or coherent.
   1218        1.7       mrg  */
   1219        1.7       mrg int
   1220       1.85  nakayama iommu_dvmamem_map(bus_dma_tag_t t, bus_dma_segment_t *segs, int nsegs,
   1221       1.85  nakayama 	size_t size, void **kvap, int flags)
   1222        1.7       mrg {
   1223       1.58       chs 	struct vm_page *pg;
   1224        1.7       mrg 	vaddr_t va;
   1225        1.7       mrg 	bus_addr_t addr;
   1226       1.58       chs 	struct pglist *pglist;
   1227        1.8       mrg 	int cbit;
   1228       1.77      yamt 	const uvm_flag_t kmflags =
   1229       1.77      yamt 	    (flags & BUS_DMA_NOWAIT) != 0 ? UVM_KMF_NOWAIT : 0;
   1230        1.7       mrg 
   1231       1.22       mrg 	DPRINTF(IDB_BUSDMA, ("iommu_dvmamem_map: segp %p nsegs %d size %lx\n",
   1232        1.7       mrg 	    segs, nsegs, size));
   1233        1.7       mrg 
   1234        1.7       mrg 	/*
   1235        1.8       mrg 	 * Allocate some space in the kernel map, and then map these pages
   1236        1.8       mrg 	 * into this space.
   1237        1.7       mrg 	 */
   1238        1.8       mrg 	size = round_page(size);
   1239       1.77      yamt 	va = uvm_km_alloc(kernel_map, size, 0, UVM_KMF_VAONLY | kmflags);
   1240        1.8       mrg 	if (va == 0)
   1241        1.8       mrg 		return (ENOMEM);
   1242        1.7       mrg 
   1243       1.81  christos 	*kvap = (void *)va;
   1244        1.7       mrg 
   1245       1.58       chs 	/*
   1246        1.7       mrg 	 * digest flags:
   1247        1.7       mrg 	 */
   1248        1.7       mrg 	cbit = 0;
   1249        1.7       mrg 	if (flags & BUS_DMA_COHERENT)	/* Disable vcache */
   1250        1.7       mrg 		cbit |= PMAP_NVC;
   1251       1.97     skrll 	if (flags & BUS_DMA_NOCACHE)	/* side effects */
   1252        1.7       mrg 		cbit |= PMAP_NC;
   1253        1.7       mrg 
   1254        1.7       mrg 	/*
   1255        1.8       mrg 	 * Now take this and map it into the CPU.
   1256        1.7       mrg 	 */
   1257       1.58       chs 	pglist = segs[0]._ds_mlist;
   1258       1.83        ad 	TAILQ_FOREACH(pg, pglist, pageq.queue) {
   1259        1.8       mrg #ifdef DIAGNOSTIC
   1260        1.7       mrg 		if (size == 0)
   1261        1.7       mrg 			panic("iommu_dvmamem_map: size botch");
   1262        1.8       mrg #endif
   1263       1.58       chs 		addr = VM_PAGE_TO_PHYS(pg);
   1264       1.22       mrg 		DPRINTF(IDB_BUSDMA, ("iommu_dvmamem_map: "
   1265       1.25       mrg 		    "mapping va %lx at %llx\n", va, (unsigned long long)addr | cbit));
   1266       1.88    cegger 		pmap_kenter_pa(va, addr | cbit,
   1267       1.88    cegger 		    VM_PROT_READ | VM_PROT_WRITE, 0);
   1268        1.7       mrg 		va += PAGE_SIZE;
   1269        1.7       mrg 		size -= PAGE_SIZE;
   1270        1.7       mrg 	}
   1271       1.38     chris 	pmap_update(pmap_kernel());
   1272        1.7       mrg 	return (0);
   1273        1.7       mrg }
   1274        1.7       mrg 
   1275        1.7       mrg /*
   1276        1.7       mrg  * Unmap DVMA mappings from kernel
   1277        1.7       mrg  */
   1278        1.7       mrg void
   1279       1.85  nakayama iommu_dvmamem_unmap(bus_dma_tag_t t, void *kva, size_t size)
   1280        1.7       mrg {
   1281       1.58       chs 
   1282       1.22       mrg 	DPRINTF(IDB_BUSDMA, ("iommu_dvmamem_unmap: kvm %p size %lx\n",
   1283        1.7       mrg 	    kva, size));
   1284       1.58       chs 
   1285        1.7       mrg #ifdef DIAGNOSTIC
   1286        1.7       mrg 	if ((u_long)kva & PGOFSET)
   1287        1.7       mrg 		panic("iommu_dvmamem_unmap");
   1288        1.7       mrg #endif
   1289       1.58       chs 
   1290        1.7       mrg 	size = round_page(size);
   1291       1.58       chs 	pmap_kremove((vaddr_t)kva, size);
   1292       1.38     chris 	pmap_update(pmap_kernel());
   1293       1.76      yamt 	uvm_km_free(kernel_map, (vaddr_t)kva, size, UVM_KMF_VAONLY);
   1294        1.1       mrg }
   1295