Home | History | Annotate | Line # | Download | only in arm32
bus_dma.c revision 1.49
      1 /*	$NetBSD: bus_dma.c,v 1.49 2006/04/10 03:07:40 simonb Exp $	*/
      2 
      3 /*-
      4  * Copyright (c) 1996, 1997, 1998 The NetBSD Foundation, Inc.
      5  * All rights reserved.
      6  *
      7  * This code is derived from software contributed to The NetBSD Foundation
      8  * by Jason R. Thorpe of the Numerical Aerospace Simulation Facility,
      9  * NASA Ames Research Center.
     10  *
     11  * Redistribution and use in source and binary forms, with or without
     12  * modification, are permitted provided that the following conditions
     13  * are met:
     14  * 1. Redistributions of source code must retain the above copyright
     15  *    notice, this list of conditions and the following disclaimer.
     16  * 2. Redistributions in binary form must reproduce the above copyright
     17  *    notice, this list of conditions and the following disclaimer in the
     18  *    documentation and/or other materials provided with the distribution.
     19  * 3. All advertising materials mentioning features or use of this software
     20  *    must display the following acknowledgement:
     21  *	This product includes software developed by the NetBSD
     22  *	Foundation, Inc. and its contributors.
     23  * 4. Neither the name of The NetBSD Foundation nor the names of its
     24  *    contributors may be used to endorse or promote products derived
     25  *    from this software without specific prior written permission.
     26  *
     27  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     28  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     29  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     30  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     31  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     32  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     33  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     34  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     35  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     36  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     37  * POSSIBILITY OF SUCH DAMAGE.
     38  */
     39 
     40 #define _ARM32_BUS_DMA_PRIVATE
     41 
     42 #include <sys/cdefs.h>
     43 __KERNEL_RCSID(0, "$NetBSD: bus_dma.c,v 1.49 2006/04/10 03:07:40 simonb Exp $");
     44 
     45 #include <sys/param.h>
     46 #include <sys/systm.h>
     47 #include <sys/kernel.h>
     48 #include <sys/proc.h>
     49 #include <sys/buf.h>
     50 #include <sys/reboot.h>
     51 #include <sys/conf.h>
     52 #include <sys/file.h>
     53 #include <sys/malloc.h>
     54 #include <sys/mbuf.h>
     55 #include <sys/vnode.h>
     56 #include <sys/device.h>
     57 
     58 #include <uvm/uvm_extern.h>
     59 
     60 #include <machine/bus.h>
     61 #include <machine/cpu.h>
     62 
     63 #include <arm/cpufunc.h>
     64 
     65 int	_bus_dmamap_load_buffer(bus_dma_tag_t, bus_dmamap_t, void *,
     66 	    bus_size_t, struct vmspace *, int);
     67 struct arm32_dma_range *_bus_dma_inrange(struct arm32_dma_range *,
     68 	    int, bus_addr_t);
     69 
     70 /*
     71  * Check to see if the specified page is in an allowed DMA range.
     72  */
     73 inline struct arm32_dma_range *
     74 _bus_dma_inrange(struct arm32_dma_range *ranges, int nranges,
     75     bus_addr_t curaddr)
     76 {
     77 	struct arm32_dma_range *dr;
     78 	int i;
     79 
     80 	for (i = 0, dr = ranges; i < nranges; i++, dr++) {
     81 		if (curaddr >= dr->dr_sysbase &&
     82 		    round_page(curaddr) <= (dr->dr_sysbase + dr->dr_len))
     83 			return (dr);
     84 	}
     85 
     86 	return (NULL);
     87 }
     88 
     89 /*
     90  * Common function to load the specified physical address into the
     91  * DMA map, coalescing segments and boundary checking as necessary.
     92  */
     93 static int
     94 _bus_dmamap_load_paddr(bus_dma_tag_t t, bus_dmamap_t map,
     95     bus_addr_t paddr, bus_size_t size)
     96 {
     97 	bus_dma_segment_t * const segs = map->dm_segs;
     98 	int nseg = map->dm_nsegs;
     99 	bus_addr_t lastaddr = 0xdead;	/* XXX gcc */
    100 	bus_addr_t bmask = ~(map->_dm_boundary - 1);
    101 	bus_addr_t curaddr;
    102 	bus_size_t sgsize;
    103 
    104 	if (nseg > 0)
    105 		lastaddr = segs[nseg-1].ds_addr + segs[nseg-1].ds_len;
    106  again:
    107 	sgsize = size;
    108 
    109 	/* Make sure we're in an allowed DMA range. */
    110 	if (t->_ranges != NULL) {
    111 		/* XXX cache last result? */
    112 		const struct arm32_dma_range * const dr =
    113 		    _bus_dma_inrange(t->_ranges, t->_nranges, paddr);
    114 		if (dr == NULL)
    115 			return (EINVAL);
    116 
    117 		/*
    118 		 * In a valid DMA range.  Translate the physical
    119 		 * memory address to an address in the DMA window.
    120 		 */
    121 		curaddr = (paddr - dr->dr_sysbase) + dr->dr_busbase;
    122 	} else
    123 		curaddr = paddr;
    124 
    125 	/*
    126 	 * Make sure we don't cross any boundaries.
    127 	 */
    128 	if (map->_dm_boundary > 0) {
    129 		bus_addr_t baddr;	/* next boundary address */
    130 
    131 		baddr = (curaddr + map->_dm_boundary) & bmask;
    132 		if (sgsize > (baddr - curaddr))
    133 			sgsize = (baddr - curaddr);
    134 	}
    135 
    136 	/*
    137 	 * Insert chunk into a segment, coalescing with the
    138 	 * previous segment if possible.
    139 	 */
    140 	if (nseg > 0 && curaddr == lastaddr &&
    141 	    segs[nseg-1].ds_len + sgsize <= map->dm_maxsegsz &&
    142 	    (map->_dm_boundary == 0 ||
    143 	     (segs[nseg-1].ds_addr & bmask) == (curaddr & bmask))) {
    144 	     	/* coalesce */
    145 		segs[nseg-1].ds_len += sgsize;
    146 	} else if (nseg >= map->_dm_segcnt) {
    147 		return (EFBIG);
    148 	} else {
    149 		/* new segment */
    150 		segs[nseg].ds_addr = curaddr;
    151 		segs[nseg].ds_len = sgsize;
    152 		nseg++;
    153 	}
    154 
    155 	lastaddr = curaddr + sgsize;
    156 
    157 	paddr += sgsize;
    158 	size -= sgsize;
    159 	if (size > 0)
    160 		goto again;
    161 
    162 	map->dm_nsegs = nseg;
    163 	return (0);
    164 }
    165 
    166 /*
    167  * Common function for DMA map creation.  May be called by bus-specific
    168  * DMA map creation functions.
    169  */
    170 int
    171 _bus_dmamap_create(bus_dma_tag_t t, bus_size_t size, int nsegments,
    172     bus_size_t maxsegsz, bus_size_t boundary, int flags, bus_dmamap_t *dmamp)
    173 {
    174 	struct arm32_bus_dmamap *map;
    175 	void *mapstore;
    176 	size_t mapsize;
    177 
    178 #ifdef DEBUG_DMA
    179 	printf("dmamap_create: t=%p size=%lx nseg=%x msegsz=%lx boundary=%lx flags=%x\n",
    180 	    t, size, nsegments, maxsegsz, boundary, flags);
    181 #endif	/* DEBUG_DMA */
    182 
    183 	/*
    184 	 * Allocate and initialize the DMA map.  The end of the map
    185 	 * is a variable-sized array of segments, so we allocate enough
    186 	 * room for them in one shot.
    187 	 *
    188 	 * Note we don't preserve the WAITOK or NOWAIT flags.  Preservation
    189 	 * of ALLOCNOW notifies others that we've reserved these resources,
    190 	 * and they are not to be freed.
    191 	 *
    192 	 * The bus_dmamap_t includes one bus_dma_segment_t, hence
    193 	 * the (nsegments - 1).
    194 	 */
    195 	mapsize = sizeof(struct arm32_bus_dmamap) +
    196 	    (sizeof(bus_dma_segment_t) * (nsegments - 1));
    197 	if ((mapstore = malloc(mapsize, M_DMAMAP,
    198 	    (flags & BUS_DMA_NOWAIT) ? M_NOWAIT : M_WAITOK)) == NULL)
    199 		return (ENOMEM);
    200 
    201 	memset(mapstore, 0, mapsize);
    202 	map = (struct arm32_bus_dmamap *)mapstore;
    203 	map->_dm_size = size;
    204 	map->_dm_segcnt = nsegments;
    205 	map->_dm_maxmaxsegsz = maxsegsz;
    206 	map->_dm_boundary = boundary;
    207 	map->_dm_flags = flags & ~(BUS_DMA_WAITOK|BUS_DMA_NOWAIT);
    208 	map->_dm_origbuf = NULL;
    209 	map->_dm_buftype = ARM32_BUFTYPE_INVALID;
    210 	map->_dm_vmspace = vmspace_kernel();
    211 	map->dm_maxsegsz = maxsegsz;
    212 	map->dm_mapsize = 0;		/* no valid mappings */
    213 	map->dm_nsegs = 0;
    214 
    215 	*dmamp = map;
    216 #ifdef DEBUG_DMA
    217 	printf("dmamap_create:map=%p\n", map);
    218 #endif	/* DEBUG_DMA */
    219 	return (0);
    220 }
    221 
    222 /*
    223  * Common function for DMA map destruction.  May be called by bus-specific
    224  * DMA map destruction functions.
    225  */
    226 void
    227 _bus_dmamap_destroy(bus_dma_tag_t t, bus_dmamap_t map)
    228 {
    229 
    230 #ifdef DEBUG_DMA
    231 	printf("dmamap_destroy: t=%p map=%p\n", t, map);
    232 #endif	/* DEBUG_DMA */
    233 
    234 	/*
    235 	 * Explicit unload.
    236 	 */
    237 	map->dm_maxsegsz = map->_dm_maxmaxsegsz;
    238 	map->dm_mapsize = 0;
    239 	map->dm_nsegs = 0;
    240 	map->_dm_origbuf = NULL;
    241 	map->_dm_buftype = ARM32_BUFTYPE_INVALID;
    242 	map->_dm_vmspace = NULL;
    243 
    244 	free(map, M_DMAMAP);
    245 }
    246 
    247 /*
    248  * Common function for loading a DMA map with a linear buffer.  May
    249  * be called by bus-specific DMA map load functions.
    250  */
    251 int
    252 _bus_dmamap_load(bus_dma_tag_t t, bus_dmamap_t map, void *buf,
    253     bus_size_t buflen, struct proc *p, int flags)
    254 {
    255 	int error;
    256 	struct vmspace *vm;
    257 
    258 #ifdef DEBUG_DMA
    259 	printf("dmamap_load: t=%p map=%p buf=%p len=%lx p=%p f=%d\n",
    260 	    t, map, buf, buflen, p, flags);
    261 #endif	/* DEBUG_DMA */
    262 
    263 	/*
    264 	 * Make sure that on error condition we return "no valid mappings".
    265 	 */
    266 	map->dm_mapsize = 0;
    267 	map->dm_nsegs = 0;
    268 	KASSERT(map->dm_maxsegsz <= map->_dm_maxmaxsegsz);
    269 
    270 	if (buflen > map->_dm_size)
    271 		return (EINVAL);
    272 
    273 	if (p != NULL) {
    274 		vm = p->p_vmspace;
    275 	} else {
    276 		vm = vmspace_kernel();
    277 	}
    278 
    279 	/* _bus_dmamap_load_buffer() clears this if we're not... */
    280 	map->_dm_flags |= ARM32_DMAMAP_COHERENT;
    281 
    282 	error = _bus_dmamap_load_buffer(t, map, buf, buflen, vm, flags);
    283 	if (error == 0) {
    284 		map->dm_mapsize = buflen;
    285 		map->_dm_origbuf = buf;
    286 		map->_dm_buftype = ARM32_BUFTYPE_LINEAR;
    287 		map->_dm_vmspace = vm;
    288 	}
    289 #ifdef DEBUG_DMA
    290 	printf("dmamap_load: error=%d\n", error);
    291 #endif	/* DEBUG_DMA */
    292 	return (error);
    293 }
    294 
    295 /*
    296  * Like _bus_dmamap_load(), but for mbufs.
    297  */
    298 int
    299 _bus_dmamap_load_mbuf(bus_dma_tag_t t, bus_dmamap_t map, struct mbuf *m0,
    300     int flags)
    301 {
    302 	int error;
    303 	struct mbuf *m;
    304 
    305 #ifdef DEBUG_DMA
    306 	printf("dmamap_load_mbuf: t=%p map=%p m0=%p f=%d\n",
    307 	    t, map, m0, flags);
    308 #endif	/* DEBUG_DMA */
    309 
    310 	/*
    311 	 * Make sure that on error condition we return "no valid mappings."
    312 	 */
    313 	map->dm_mapsize = 0;
    314 	map->dm_nsegs = 0;
    315 	KASSERT(map->dm_maxsegsz <= map->_dm_maxmaxsegsz);
    316 
    317 #ifdef DIAGNOSTIC
    318 	if ((m0->m_flags & M_PKTHDR) == 0)
    319 		panic("_bus_dmamap_load_mbuf: no packet header");
    320 #endif	/* DIAGNOSTIC */
    321 
    322 	if (m0->m_pkthdr.len > map->_dm_size)
    323 		return (EINVAL);
    324 
    325 	/*
    326 	 * Mbuf chains should almost never have coherent (i.e.
    327 	 * un-cached) mappings, so clear that flag now.
    328 	 */
    329 	map->_dm_flags &= ~ARM32_DMAMAP_COHERENT;
    330 
    331 	error = 0;
    332 	for (m = m0; m != NULL && error == 0; m = m->m_next) {
    333 		int offset;
    334 		int remainbytes;
    335 		const struct vm_page * const *pgs;
    336 		paddr_t paddr;
    337 		int size;
    338 
    339 		if (m->m_len == 0)
    340 			continue;
    341 		switch (m->m_flags & (M_EXT|M_CLUSTER|M_EXT_PAGES)) {
    342 		case M_EXT|M_CLUSTER:
    343 			/* XXX KDASSERT */
    344 			KASSERT(m->m_ext.ext_paddr != M_PADDR_INVALID);
    345 			paddr = m->m_ext.ext_paddr +
    346 			    (m->m_data - m->m_ext.ext_buf);
    347 			size = m->m_len;
    348 			error = _bus_dmamap_load_paddr(t, map, paddr, size);
    349 			break;
    350 
    351 		case M_EXT|M_EXT_PAGES:
    352 			KASSERT(m->m_ext.ext_buf <= m->m_data);
    353 			KASSERT(m->m_data <=
    354 			    m->m_ext.ext_buf + m->m_ext.ext_size);
    355 
    356 			offset = (vaddr_t)m->m_data -
    357 			    trunc_page((vaddr_t)m->m_ext.ext_buf);
    358 			remainbytes = m->m_len;
    359 
    360 			/* skip uninteresting pages */
    361 			pgs = (const struct vm_page * const *)
    362 			    m->m_ext.ext_pgs + (offset >> PAGE_SHIFT);
    363 
    364 			offset &= PAGE_MASK;	/* offset in the first page */
    365 
    366 			/* load each page */
    367 			while (remainbytes > 0) {
    368 				const struct vm_page *pg;
    369 
    370 				size = MIN(remainbytes, PAGE_SIZE - offset);
    371 
    372 				pg = *pgs++;
    373 				KASSERT(pg);
    374 				paddr = VM_PAGE_TO_PHYS(pg) + offset;
    375 
    376 				error = _bus_dmamap_load_paddr(t, map,
    377 				    paddr, size);
    378 				if (error)
    379 					break;
    380 				offset = 0;
    381 				remainbytes -= size;
    382 			}
    383 			break;
    384 
    385 		case 0:
    386 			paddr = m->m_paddr + M_BUFOFFSET(m) +
    387 			    (m->m_data - M_BUFADDR(m));
    388 			size = m->m_len;
    389 			error = _bus_dmamap_load_paddr(t, map, paddr, size);
    390 			break;
    391 
    392 		default:
    393 			error = _bus_dmamap_load_buffer(t, map, m->m_data,
    394 			    m->m_len, vmspace_kernel(), flags);
    395 		}
    396 	}
    397 	if (error == 0) {
    398 		map->dm_mapsize = m0->m_pkthdr.len;
    399 		map->_dm_origbuf = m0;
    400 		map->_dm_buftype = ARM32_BUFTYPE_MBUF;
    401 		map->_dm_vmspace = vmspace_kernel();	/* always kernel */
    402 	}
    403 #ifdef DEBUG_DMA
    404 	printf("dmamap_load_mbuf: error=%d\n", error);
    405 #endif	/* DEBUG_DMA */
    406 	return (error);
    407 }
    408 
    409 /*
    410  * Like _bus_dmamap_load(), but for uios.
    411  */
    412 int
    413 _bus_dmamap_load_uio(bus_dma_tag_t t, bus_dmamap_t map, struct uio *uio,
    414     int flags)
    415 {
    416 	int i, error;
    417 	bus_size_t minlen, resid;
    418 	struct iovec *iov;
    419 	caddr_t addr;
    420 
    421 	/*
    422 	 * Make sure that on error condition we return "no valid mappings."
    423 	 */
    424 	map->dm_mapsize = 0;
    425 	map->dm_nsegs = 0;
    426 	KASSERT(map->dm_maxsegsz <= map->_dm_maxmaxsegsz);
    427 
    428 	resid = uio->uio_resid;
    429 	iov = uio->uio_iov;
    430 
    431 	/* _bus_dmamap_load_buffer() clears this if we're not... */
    432 	map->_dm_flags |= ARM32_DMAMAP_COHERENT;
    433 
    434 	error = 0;
    435 	for (i = 0; i < uio->uio_iovcnt && resid != 0 && error == 0; i++) {
    436 		/*
    437 		 * Now at the first iovec to load.  Load each iovec
    438 		 * until we have exhausted the residual count.
    439 		 */
    440 		minlen = resid < iov[i].iov_len ? resid : iov[i].iov_len;
    441 		addr = (caddr_t)iov[i].iov_base;
    442 
    443 		error = _bus_dmamap_load_buffer(t, map, addr, minlen,
    444 		    uio->uio_vmspace, flags);
    445 
    446 		resid -= minlen;
    447 	}
    448 	if (error == 0) {
    449 		map->dm_mapsize = uio->uio_resid;
    450 		map->_dm_origbuf = uio;
    451 		map->_dm_buftype = ARM32_BUFTYPE_UIO;
    452 		map->_dm_vmspace = uio->uio_vmspace;
    453 	}
    454 	return (error);
    455 }
    456 
    457 /*
    458  * Like _bus_dmamap_load(), but for raw memory allocated with
    459  * bus_dmamem_alloc().
    460  */
    461 int
    462 _bus_dmamap_load_raw(bus_dma_tag_t t, bus_dmamap_t map,
    463     bus_dma_segment_t *segs, int nsegs, bus_size_t size, int flags)
    464 {
    465 
    466 	panic("_bus_dmamap_load_raw: not implemented");
    467 }
    468 
    469 /*
    470  * Common function for unloading a DMA map.  May be called by
    471  * bus-specific DMA map unload functions.
    472  */
    473 void
    474 _bus_dmamap_unload(bus_dma_tag_t t, bus_dmamap_t map)
    475 {
    476 
    477 #ifdef DEBUG_DMA
    478 	printf("dmamap_unload: t=%p map=%p\n", t, map);
    479 #endif	/* DEBUG_DMA */
    480 
    481 	/*
    482 	 * No resources to free; just mark the mappings as
    483 	 * invalid.
    484 	 */
    485 	map->dm_mapsize = 0;
    486 	map->dm_nsegs = 0;
    487 	map->_dm_origbuf = NULL;
    488 	map->_dm_buftype = ARM32_BUFTYPE_INVALID;
    489 	map->_dm_vmspace = NULL;
    490 }
    491 
    492 static inline void
    493 _bus_dmamap_sync_linear(bus_dma_tag_t t, bus_dmamap_t map, bus_addr_t offset,
    494     bus_size_t len, int ops)
    495 {
    496 	vaddr_t addr = (vaddr_t) map->_dm_origbuf;
    497 
    498 	addr += offset;
    499 
    500 	switch (ops) {
    501 	case BUS_DMASYNC_PREREAD|BUS_DMASYNC_PREWRITE:
    502 		cpu_dcache_wbinv_range(addr, len);
    503 		break;
    504 
    505 	case BUS_DMASYNC_PREREAD:
    506 		if (((addr | len) & arm_dcache_align_mask) == 0)
    507 			cpu_dcache_inv_range(addr, len);
    508 		else
    509 			cpu_dcache_wbinv_range(addr, len);
    510 		break;
    511 
    512 	case BUS_DMASYNC_PREWRITE:
    513 		cpu_dcache_wb_range(addr, len);
    514 		break;
    515 	}
    516 }
    517 
    518 static inline void
    519 _bus_dmamap_sync_mbuf(bus_dma_tag_t t, bus_dmamap_t map, bus_addr_t offset,
    520     bus_size_t len, int ops)
    521 {
    522 	struct mbuf *m, *m0 = map->_dm_origbuf;
    523 	bus_size_t minlen, moff;
    524 	vaddr_t maddr;
    525 
    526 	for (moff = offset, m = m0; m != NULL && len != 0; m = m->m_next) {
    527 		/* Find the beginning mbuf. */
    528 		if (moff >= m->m_len) {
    529 			moff -= m->m_len;
    530 			continue;
    531 		}
    532 
    533 		/*
    534 		 * Now at the first mbuf to sync; nail each one until
    535 		 * we have exhausted the length.
    536 		 */
    537 		minlen = m->m_len - moff;
    538 		if (len < minlen)
    539 			minlen = len;
    540 
    541 		maddr = mtod(m, vaddr_t);
    542 		maddr += moff;
    543 
    544 		/*
    545 		 * We can save a lot of work here if we know the mapping
    546 		 * is read-only at the MMU:
    547 		 *
    548 		 * If a mapping is read-only, no dirty cache blocks will
    549 		 * exist for it.  If a writable mapping was made read-only,
    550 		 * we know any dirty cache lines for the range will have
    551 		 * been cleaned for us already.  Therefore, if the upper
    552 		 * layer can tell us we have a read-only mapping, we can
    553 		 * skip all cache cleaning.
    554 		 *
    555 		 * NOTE: This only works if we know the pmap cleans pages
    556 		 * before making a read-write -> read-only transition.  If
    557 		 * this ever becomes non-true (e.g. Physically Indexed
    558 		 * cache), this will have to be revisited.
    559 		 */
    560 		switch (ops) {
    561 		case BUS_DMASYNC_PREREAD|BUS_DMASYNC_PREWRITE:
    562 			if (! M_ROMAP(m)) {
    563 				cpu_dcache_wbinv_range(maddr, minlen);
    564 				break;
    565 			}
    566 			/* else FALLTHROUGH */
    567 
    568 		case BUS_DMASYNC_PREREAD:
    569 			if (((maddr | minlen) & arm_dcache_align_mask) == 0)
    570 				cpu_dcache_inv_range(maddr, minlen);
    571 			else
    572 				cpu_dcache_wbinv_range(maddr, minlen);
    573 			break;
    574 
    575 		case BUS_DMASYNC_PREWRITE:
    576 			if (! M_ROMAP(m))
    577 				cpu_dcache_wb_range(maddr, minlen);
    578 			break;
    579 		}
    580 		moff = 0;
    581 		len -= minlen;
    582 	}
    583 }
    584 
    585 static inline void
    586 _bus_dmamap_sync_uio(bus_dma_tag_t t, bus_dmamap_t map, bus_addr_t offset,
    587     bus_size_t len, int ops)
    588 {
    589 	struct uio *uio = map->_dm_origbuf;
    590 	struct iovec *iov;
    591 	bus_size_t minlen, ioff;
    592 	vaddr_t addr;
    593 
    594 	for (iov = uio->uio_iov, ioff = offset; len != 0; iov++) {
    595 		/* Find the beginning iovec. */
    596 		if (ioff >= iov->iov_len) {
    597 			ioff -= iov->iov_len;
    598 			continue;
    599 		}
    600 
    601 		/*
    602 		 * Now at the first iovec to sync; nail each one until
    603 		 * we have exhausted the length.
    604 		 */
    605 		minlen = iov->iov_len - ioff;
    606 		if (len < minlen)
    607 			minlen = len;
    608 
    609 		addr = (vaddr_t) iov->iov_base;
    610 		addr += ioff;
    611 
    612 		switch (ops) {
    613 		case BUS_DMASYNC_PREREAD|BUS_DMASYNC_PREWRITE:
    614 			cpu_dcache_wbinv_range(addr, minlen);
    615 			break;
    616 
    617 		case BUS_DMASYNC_PREREAD:
    618 			if (((addr | minlen) & arm_dcache_align_mask) == 0)
    619 				cpu_dcache_inv_range(addr, minlen);
    620 			else
    621 				cpu_dcache_wbinv_range(addr, minlen);
    622 			break;
    623 
    624 		case BUS_DMASYNC_PREWRITE:
    625 			cpu_dcache_wb_range(addr, minlen);
    626 			break;
    627 		}
    628 		ioff = 0;
    629 		len -= minlen;
    630 	}
    631 }
    632 
    633 /*
    634  * Common function for DMA map synchronization.  May be called
    635  * by bus-specific DMA map synchronization functions.
    636  *
    637  * This version works for the Virtually Indexed Virtually Tagged
    638  * cache found on 32-bit ARM processors.
    639  *
    640  * XXX Should have separate versions for write-through vs.
    641  * XXX write-back caches.  We currently assume write-back
    642  * XXX here, which is not as efficient as it could be for
    643  * XXX the write-through case.
    644  */
    645 void
    646 _bus_dmamap_sync(bus_dma_tag_t t, bus_dmamap_t map, bus_addr_t offset,
    647     bus_size_t len, int ops)
    648 {
    649 
    650 #ifdef DEBUG_DMA
    651 	printf("dmamap_sync: t=%p map=%p offset=%lx len=%lx ops=%x\n",
    652 	    t, map, offset, len, ops);
    653 #endif	/* DEBUG_DMA */
    654 
    655 	/*
    656 	 * Mixing of PRE and POST operations is not allowed.
    657 	 */
    658 	if ((ops & (BUS_DMASYNC_PREREAD|BUS_DMASYNC_PREWRITE)) != 0 &&
    659 	    (ops & (BUS_DMASYNC_POSTREAD|BUS_DMASYNC_POSTWRITE)) != 0)
    660 		panic("_bus_dmamap_sync: mix PRE and POST");
    661 
    662 #ifdef DIAGNOSTIC
    663 	if (offset >= map->dm_mapsize)
    664 		panic("_bus_dmamap_sync: bad offset %lu (map size is %lu)",
    665 		    offset, map->dm_mapsize);
    666 	if (len == 0 || (offset + len) > map->dm_mapsize)
    667 		panic("_bus_dmamap_sync: bad length");
    668 #endif
    669 
    670 	/*
    671 	 * For a virtually-indexed write-back cache, we need
    672 	 * to do the following things:
    673 	 *
    674 	 *	PREREAD -- Invalidate the D-cache.  We do this
    675 	 *	here in case a write-back is required by the back-end.
    676 	 *
    677 	 *	PREWRITE -- Write-back the D-cache.  Note that if
    678 	 *	we are doing a PREREAD|PREWRITE, we can collapse
    679 	 *	the whole thing into a single Wb-Inv.
    680 	 *
    681 	 *	POSTREAD -- Nothing.
    682 	 *
    683 	 *	POSTWRITE -- Nothing.
    684 	 */
    685 
    686 	ops &= (BUS_DMASYNC_PREREAD|BUS_DMASYNC_PREWRITE);
    687 	if (ops == 0)
    688 		return;
    689 
    690 	/* Skip cache frobbing if mapping was COHERENT. */
    691 	if (map->_dm_flags & ARM32_DMAMAP_COHERENT) {
    692 		/* Drain the write buffer. */
    693 		cpu_drain_writebuf();
    694 		return;
    695 	}
    696 
    697 	/*
    698 	 * If the mapping belongs to a non-kernel vmspace, and the
    699 	 * vmspace has not been active since the last time a full
    700 	 * cache flush was performed, we don't need to do anything.
    701 	 */
    702 	if (__predict_false(!VMSPACE_IS_KERNEL_P(map->_dm_vmspace) &&
    703 	    vm_map_pmap(&map->_dm_vmspace->vm_map)->pm_cstate.cs_cache_d == 0))
    704 		return;
    705 
    706 	switch (map->_dm_buftype) {
    707 	case ARM32_BUFTYPE_LINEAR:
    708 		_bus_dmamap_sync_linear(t, map, offset, len, ops);
    709 		break;
    710 
    711 	case ARM32_BUFTYPE_MBUF:
    712 		_bus_dmamap_sync_mbuf(t, map, offset, len, ops);
    713 		break;
    714 
    715 	case ARM32_BUFTYPE_UIO:
    716 		_bus_dmamap_sync_uio(t, map, offset, len, ops);
    717 		break;
    718 
    719 	case ARM32_BUFTYPE_RAW:
    720 		panic("_bus_dmamap_sync: ARM32_BUFTYPE_RAW");
    721 		break;
    722 
    723 	case ARM32_BUFTYPE_INVALID:
    724 		panic("_bus_dmamap_sync: ARM32_BUFTYPE_INVALID");
    725 		break;
    726 
    727 	default:
    728 		printf("unknown buffer type %d\n", map->_dm_buftype);
    729 		panic("_bus_dmamap_sync");
    730 	}
    731 
    732 	/* Drain the write buffer. */
    733 	cpu_drain_writebuf();
    734 }
    735 
    736 /*
    737  * Common function for DMA-safe memory allocation.  May be called
    738  * by bus-specific DMA memory allocation functions.
    739  */
    740 
    741 extern paddr_t physical_start;
    742 extern paddr_t physical_end;
    743 
    744 int
    745 _bus_dmamem_alloc(bus_dma_tag_t t, bus_size_t size, bus_size_t alignment,
    746     bus_size_t boundary, bus_dma_segment_t *segs, int nsegs, int *rsegs,
    747     int flags)
    748 {
    749 	struct arm32_dma_range *dr;
    750 	int error, i;
    751 
    752 #ifdef DEBUG_DMA
    753 	printf("dmamem_alloc t=%p size=%lx align=%lx boundary=%lx "
    754 	    "segs=%p nsegs=%x rsegs=%p flags=%x\n", t, size, alignment,
    755 	    boundary, segs, nsegs, rsegs, flags);
    756 #endif
    757 
    758 	if ((dr = t->_ranges) != NULL) {
    759 		error = ENOMEM;
    760 		for (i = 0; i < t->_nranges; i++, dr++) {
    761 			if (dr->dr_len == 0)
    762 				continue;
    763 			error = _bus_dmamem_alloc_range(t, size, alignment,
    764 			    boundary, segs, nsegs, rsegs, flags,
    765 			    trunc_page(dr->dr_sysbase),
    766 			    trunc_page(dr->dr_sysbase + dr->dr_len));
    767 			if (error == 0)
    768 				break;
    769 		}
    770 	} else {
    771 		error = _bus_dmamem_alloc_range(t, size, alignment, boundary,
    772 		    segs, nsegs, rsegs, flags, trunc_page(physical_start),
    773 		    trunc_page(physical_end));
    774 	}
    775 
    776 #ifdef DEBUG_DMA
    777 	printf("dmamem_alloc: =%d\n", error);
    778 #endif
    779 
    780 	return(error);
    781 }
    782 
    783 /*
    784  * Common function for freeing DMA-safe memory.  May be called by
    785  * bus-specific DMA memory free functions.
    786  */
    787 void
    788 _bus_dmamem_free(bus_dma_tag_t t, bus_dma_segment_t *segs, int nsegs)
    789 {
    790 	struct vm_page *m;
    791 	bus_addr_t addr;
    792 	struct pglist mlist;
    793 	int curseg;
    794 
    795 #ifdef DEBUG_DMA
    796 	printf("dmamem_free: t=%p segs=%p nsegs=%x\n", t, segs, nsegs);
    797 #endif	/* DEBUG_DMA */
    798 
    799 	/*
    800 	 * Build a list of pages to free back to the VM system.
    801 	 */
    802 	TAILQ_INIT(&mlist);
    803 	for (curseg = 0; curseg < nsegs; curseg++) {
    804 		for (addr = segs[curseg].ds_addr;
    805 		    addr < (segs[curseg].ds_addr + segs[curseg].ds_len);
    806 		    addr += PAGE_SIZE) {
    807 			m = PHYS_TO_VM_PAGE(addr);
    808 			TAILQ_INSERT_TAIL(&mlist, m, pageq);
    809 		}
    810 	}
    811 	uvm_pglistfree(&mlist);
    812 }
    813 
    814 /*
    815  * Common function for mapping DMA-safe memory.  May be called by
    816  * bus-specific DMA memory map functions.
    817  */
    818 int
    819 _bus_dmamem_map(bus_dma_tag_t t, bus_dma_segment_t *segs, int nsegs,
    820     size_t size, caddr_t *kvap, int flags)
    821 {
    822 	vaddr_t va;
    823 	bus_addr_t addr;
    824 	int curseg;
    825 	pt_entry_t *ptep/*, pte*/;
    826 	const uvm_flag_t kmflags =
    827 	    (flags & BUS_DMA_NOWAIT) != 0 ? UVM_KMF_NOWAIT : 0;
    828 
    829 #ifdef DEBUG_DMA
    830 	printf("dmamem_map: t=%p segs=%p nsegs=%x size=%lx flags=%x\n", t,
    831 	    segs, nsegs, (unsigned long)size, flags);
    832 #endif	/* DEBUG_DMA */
    833 
    834 	size = round_page(size);
    835 	va = uvm_km_alloc(kernel_map, size, 0, UVM_KMF_VAONLY | kmflags);
    836 
    837 	if (va == 0)
    838 		return (ENOMEM);
    839 
    840 	*kvap = (caddr_t)va;
    841 
    842 	for (curseg = 0; curseg < nsegs; curseg++) {
    843 		for (addr = segs[curseg].ds_addr;
    844 		    addr < (segs[curseg].ds_addr + segs[curseg].ds_len);
    845 		    addr += PAGE_SIZE, va += PAGE_SIZE, size -= PAGE_SIZE) {
    846 #ifdef DEBUG_DMA
    847 			printf("wiring p%lx to v%lx", addr, va);
    848 #endif	/* DEBUG_DMA */
    849 			if (size == 0)
    850 				panic("_bus_dmamem_map: size botch");
    851 			pmap_enter(pmap_kernel(), va, addr,
    852 			    VM_PROT_READ | VM_PROT_WRITE,
    853 			    VM_PROT_READ | VM_PROT_WRITE | PMAP_WIRED);
    854 			/*
    855 			 * If the memory must remain coherent with the
    856 			 * cache then we must make the memory uncacheable
    857 			 * in order to maintain virtual cache coherency.
    858 			 * We must also guarantee the cache does not already
    859 			 * contain the virtal addresses we are making
    860 			 * uncacheable.
    861 			 */
    862 			if (flags & BUS_DMA_COHERENT) {
    863 				cpu_dcache_wbinv_range(va, PAGE_SIZE);
    864 				cpu_drain_writebuf();
    865 				ptep = vtopte(va);
    866 				*ptep &= ~L2_S_CACHE_MASK;
    867 				PTE_SYNC(ptep);
    868 				tlb_flush();
    869 			}
    870 #ifdef DEBUG_DMA
    871 			ptep = vtopte(va);
    872 			printf(" pte=v%p *pte=%x\n", ptep, *ptep);
    873 #endif	/* DEBUG_DMA */
    874 		}
    875 	}
    876 	pmap_update(pmap_kernel());
    877 #ifdef DEBUG_DMA
    878 	printf("dmamem_map: =%p\n", *kvap);
    879 #endif	/* DEBUG_DMA */
    880 	return (0);
    881 }
    882 
    883 /*
    884  * Common function for unmapping DMA-safe memory.  May be called by
    885  * bus-specific DMA memory unmapping functions.
    886  */
    887 void
    888 _bus_dmamem_unmap(bus_dma_tag_t t, caddr_t kva, size_t size)
    889 {
    890 
    891 #ifdef DEBUG_DMA
    892 	printf("dmamem_unmap: t=%p kva=%p size=%lx\n", t, kva,
    893 	    (unsigned long)size);
    894 #endif	/* DEBUG_DMA */
    895 #ifdef DIAGNOSTIC
    896 	if ((u_long)kva & PGOFSET)
    897 		panic("_bus_dmamem_unmap");
    898 #endif	/* DIAGNOSTIC */
    899 
    900 	size = round_page(size);
    901 	pmap_remove(pmap_kernel(), (vaddr_t)kva, (vaddr_t)kva + size);
    902 	pmap_update(pmap_kernel());
    903 	uvm_km_free(kernel_map, (vaddr_t)kva, size, UVM_KMF_VAONLY);
    904 }
    905 
    906 /*
    907  * Common functin for mmap(2)'ing DMA-safe memory.  May be called by
    908  * bus-specific DMA mmap(2)'ing functions.
    909  */
    910 paddr_t
    911 _bus_dmamem_mmap(bus_dma_tag_t t, bus_dma_segment_t *segs, int nsegs,
    912     off_t off, int prot, int flags)
    913 {
    914 	int i;
    915 
    916 	for (i = 0; i < nsegs; i++) {
    917 #ifdef DIAGNOSTIC
    918 		if (off & PGOFSET)
    919 			panic("_bus_dmamem_mmap: offset unaligned");
    920 		if (segs[i].ds_addr & PGOFSET)
    921 			panic("_bus_dmamem_mmap: segment unaligned");
    922 		if (segs[i].ds_len & PGOFSET)
    923 			panic("_bus_dmamem_mmap: segment size not multiple"
    924 			    " of page size");
    925 #endif	/* DIAGNOSTIC */
    926 		if (off >= segs[i].ds_len) {
    927 			off -= segs[i].ds_len;
    928 			continue;
    929 		}
    930 
    931 		return (arm_btop((u_long)segs[i].ds_addr + off));
    932 	}
    933 
    934 	/* Page not found. */
    935 	return (-1);
    936 }
    937 
    938 /**********************************************************************
    939  * DMA utility functions
    940  **********************************************************************/
    941 
    942 /*
    943  * Utility function to load a linear buffer.  lastaddrp holds state
    944  * between invocations (for multiple-buffer loads).  segp contains
    945  * the starting segment on entrace, and the ending segment on exit.
    946  * first indicates if this is the first invocation of this function.
    947  */
    948 int
    949 _bus_dmamap_load_buffer(bus_dma_tag_t t, bus_dmamap_t map, void *buf,
    950     bus_size_t buflen, struct vmspace *vm, int flags)
    951 {
    952 	bus_size_t sgsize;
    953 	bus_addr_t curaddr;
    954 	vaddr_t vaddr = (vaddr_t)buf;
    955 	pd_entry_t *pde;
    956 	pt_entry_t pte;
    957 	int error;
    958 	pmap_t pmap;
    959 	pt_entry_t *ptep;
    960 
    961 #ifdef DEBUG_DMA
    962 	printf("_bus_dmamem_load_buffer(buf=%p, len=%lx, flags=%d)\n",
    963 	    buf, buflen, flags);
    964 #endif	/* DEBUG_DMA */
    965 
    966 	pmap = vm_map_pmap(&vm->vm_map);
    967 
    968 	while (buflen > 0) {
    969 		/*
    970 		 * Get the physical address for this segment.
    971 		 *
    972 		 * XXX Don't support checking for coherent mappings
    973 		 * XXX in user address space.
    974 		 */
    975 		if (__predict_true(pmap == pmap_kernel())) {
    976 			(void) pmap_get_pde_pte(pmap, vaddr, &pde, &ptep);
    977 			if (__predict_false(pmap_pde_section(pde))) {
    978 				curaddr = (*pde & L1_S_FRAME) |
    979 				    (vaddr & L1_S_OFFSET);
    980 				if (*pde & L1_S_CACHE_MASK) {
    981 					map->_dm_flags &=
    982 					    ~ARM32_DMAMAP_COHERENT;
    983 				}
    984 			} else {
    985 				pte = *ptep;
    986 				KDASSERT((pte & L2_TYPE_MASK) != L2_TYPE_INV);
    987 				if (__predict_false((pte & L2_TYPE_MASK)
    988 						    == L2_TYPE_L)) {
    989 					curaddr = (pte & L2_L_FRAME) |
    990 					    (vaddr & L2_L_OFFSET);
    991 					if (pte & L2_L_CACHE_MASK) {
    992 						map->_dm_flags &=
    993 						    ~ARM32_DMAMAP_COHERENT;
    994 					}
    995 				} else {
    996 					curaddr = (pte & L2_S_FRAME) |
    997 					    (vaddr & L2_S_OFFSET);
    998 					if (pte & L2_S_CACHE_MASK) {
    999 						map->_dm_flags &=
   1000 						    ~ARM32_DMAMAP_COHERENT;
   1001 					}
   1002 				}
   1003 			}
   1004 		} else {
   1005 			(void) pmap_extract(pmap, vaddr, &curaddr);
   1006 			map->_dm_flags &= ~ARM32_DMAMAP_COHERENT;
   1007 		}
   1008 
   1009 		/*
   1010 		 * Compute the segment size, and adjust counts.
   1011 		 */
   1012 		sgsize = PAGE_SIZE - ((u_long)vaddr & PGOFSET);
   1013 		if (buflen < sgsize)
   1014 			sgsize = buflen;
   1015 
   1016 		error = _bus_dmamap_load_paddr(t, map, curaddr, sgsize);
   1017 		if (error)
   1018 			return (error);
   1019 
   1020 		vaddr += sgsize;
   1021 		buflen -= sgsize;
   1022 	}
   1023 
   1024 	return (0);
   1025 }
   1026 
   1027 /*
   1028  * Allocate physical memory from the given physical address range.
   1029  * Called by DMA-safe memory allocation methods.
   1030  */
   1031 int
   1032 _bus_dmamem_alloc_range(bus_dma_tag_t t, bus_size_t size, bus_size_t alignment,
   1033     bus_size_t boundary, bus_dma_segment_t *segs, int nsegs, int *rsegs,
   1034     int flags, paddr_t low, paddr_t high)
   1035 {
   1036 	paddr_t curaddr, lastaddr;
   1037 	struct vm_page *m;
   1038 	struct pglist mlist;
   1039 	int curseg, error;
   1040 
   1041 #ifdef DEBUG_DMA
   1042 	printf("alloc_range: t=%p size=%lx align=%lx boundary=%lx segs=%p nsegs=%x rsegs=%p flags=%x lo=%lx hi=%lx\n",
   1043 	    t, size, alignment, boundary, segs, nsegs, rsegs, flags, low, high);
   1044 #endif	/* DEBUG_DMA */
   1045 
   1046 	/* Always round the size. */
   1047 	size = round_page(size);
   1048 
   1049 	/*
   1050 	 * Allocate pages from the VM system.
   1051 	 */
   1052 	error = uvm_pglistalloc(size, low, high, alignment, boundary,
   1053 	    &mlist, nsegs, (flags & BUS_DMA_NOWAIT) == 0);
   1054 	if (error)
   1055 		return (error);
   1056 
   1057 	/*
   1058 	 * Compute the location, size, and number of segments actually
   1059 	 * returned by the VM code.
   1060 	 */
   1061 	m = TAILQ_FIRST(&mlist);
   1062 	curseg = 0;
   1063 	lastaddr = segs[curseg].ds_addr = VM_PAGE_TO_PHYS(m);
   1064 	segs[curseg].ds_len = PAGE_SIZE;
   1065 #ifdef DEBUG_DMA
   1066 		printf("alloc: page %lx\n", lastaddr);
   1067 #endif	/* DEBUG_DMA */
   1068 	m = TAILQ_NEXT(m, pageq);
   1069 
   1070 	for (; m != NULL; m = TAILQ_NEXT(m, pageq)) {
   1071 		curaddr = VM_PAGE_TO_PHYS(m);
   1072 #ifdef DIAGNOSTIC
   1073 		if (curaddr < low || curaddr >= high) {
   1074 			printf("uvm_pglistalloc returned non-sensical"
   1075 			    " address 0x%lx\n", curaddr);
   1076 			panic("_bus_dmamem_alloc_range");
   1077 		}
   1078 #endif	/* DIAGNOSTIC */
   1079 #ifdef DEBUG_DMA
   1080 		printf("alloc: page %lx\n", curaddr);
   1081 #endif	/* DEBUG_DMA */
   1082 		if (curaddr == (lastaddr + PAGE_SIZE))
   1083 			segs[curseg].ds_len += PAGE_SIZE;
   1084 		else {
   1085 			curseg++;
   1086 			segs[curseg].ds_addr = curaddr;
   1087 			segs[curseg].ds_len = PAGE_SIZE;
   1088 		}
   1089 		lastaddr = curaddr;
   1090 	}
   1091 
   1092 	*rsegs = curseg + 1;
   1093 
   1094 	return (0);
   1095 }
   1096 
   1097 /*
   1098  * Check if a memory region intersects with a DMA range, and return the
   1099  * page-rounded intersection if it does.
   1100  */
   1101 int
   1102 arm32_dma_range_intersect(struct arm32_dma_range *ranges, int nranges,
   1103     paddr_t pa, psize_t size, paddr_t *pap, psize_t *sizep)
   1104 {
   1105 	struct arm32_dma_range *dr;
   1106 	int i;
   1107 
   1108 	if (ranges == NULL)
   1109 		return (0);
   1110 
   1111 	for (i = 0, dr = ranges; i < nranges; i++, dr++) {
   1112 		if (dr->dr_sysbase <= pa &&
   1113 		    pa < (dr->dr_sysbase + dr->dr_len)) {
   1114 			/*
   1115 			 * Beginning of region intersects with this range.
   1116 			 */
   1117 			*pap = trunc_page(pa);
   1118 			*sizep = round_page(min(pa + size,
   1119 			    dr->dr_sysbase + dr->dr_len) - pa);
   1120 			return (1);
   1121 		}
   1122 		if (pa < dr->dr_sysbase && dr->dr_sysbase < (pa + size)) {
   1123 			/*
   1124 			 * End of region intersects with this range.
   1125 			 */
   1126 			*pap = trunc_page(dr->dr_sysbase);
   1127 			*sizep = round_page(min((pa + size) - dr->dr_sysbase,
   1128 			    dr->dr_len));
   1129 			return (1);
   1130 		}
   1131 	}
   1132 
   1133 	/* No intersection found. */
   1134 	return (0);
   1135 }
   1136